# Importing Libraries

In [6]:
import requests
import json
import pandas as pd
from datetime import datetime

# GitHub API endpoint

In [7]:
# GitHub API endpoint
api_url = "https://api.github.com/search/repositories"

# Trending topics

In [8]:
# Trending topics
trending_topics = [
    "machine learning",
    "data visualization",
    "deep learning",
    "natural language processing",
    "data engineering",
    "data science",
    "python",
    "sql",
    "cloud computing",
    "big data"
]


# Function to fetch repository data

In [9]:
# Function to fetch repository data
def fetch_repository_data(topic):
    params = {
        "q": f"topic:{topic}",
        "sort": "stars",
        "per_page": 100
    }

    response = requests.get(api_url, params=params)
    data = response.json()["items"]

    repository_data = []
    for item in data:
        repository_data.append({
            "Topic":topic,
            "Repository_Name": item["name"],
            "Owner": item["owner"]["login"],
            "Description": item["description"],
            "URL": item["html_url"],
            "Programming_Language": item["language"],
            "Creation_Date": item["created_at"],
            "Last_Updated_Date": item["updated_at"],
            "Number_of_Stars": item["stargazers_count"],
            "Number_of_Forks": item["forks_count"],
            "Number_of_Open_Issues": item["open_issues_count"],
            "License_Type": item["license"]["name"] if item["license"] else "Unknown"
        })

    return repository_data

## Breakdown of function

## EX Topic

In [10]:
topic="machine learning"

## Parameters to fetch data

In [11]:
#Parameters
params = {
    "q": f"topic:{topic}",
    "sort": "stars",
    "per_page": 50
}
params

{'q': 'topic:machine learning', 'sort': 'stars', 'per_page': 50}

## Getting the response 

In [12]:

response = requests.get(api_url, params=params)
data = response.json()["items"]


## Fetched Data 

In [13]:
data

[{'id': 87536046,
  'node_id': 'MDEwOlJlcG9zaXRvcnk4NzUzNjA0Ng==',
  'name': 'mit-deep-learning-book-pdf',
  'full_name': 'janishar/mit-deep-learning-book-pdf',
  'private': False,
  'owner': {'login': 'janishar',
   'id': 11065002,
   'node_id': 'MDQ6VXNlcjExMDY1MDAy',
   'avatar_url': 'https://avatars.githubusercontent.com/u/11065002?v=4',
   'gravatar_id': '',
   'url': 'https://api.github.com/users/janishar',
   'html_url': 'https://github.com/janishar',
   'followers_url': 'https://api.github.com/users/janishar/followers',
   'following_url': 'https://api.github.com/users/janishar/following{/other_user}',
   'gists_url': 'https://api.github.com/users/janishar/gists{/gist_id}',
   'starred_url': 'https://api.github.com/users/janishar/starred{/owner}{/repo}',
   'subscriptions_url': 'https://api.github.com/users/janishar/subscriptions',
   'organizations_url': 'https://api.github.com/users/janishar/orgs',
   'repos_url': 'https://api.github.com/users/janishar/repos',
   'events_url'

## Data Extraction

In [14]:

repository_data = []
for item in data:
    repository_data.append({
        "Topic":topic,
        "Repository_Name": item["name"],
        "Owner": item["owner"]["login"],
        "Description": item["description"],
        "URL": item["html_url"],
        "Programming_Language": item["language"],
        "Creation_Date": item["created_at"],
        "Last_Updated_Date": item["updated_at"],
        "Number_of_Stars": item["stargazers_count"],
        "Number_of_Forks": item["forks_count"],
        "Number_of_Open_Issues": item["open_issues_count"],
        "License_Type": item["license"]["name"] if item["license"] else "Unknown"
    })

In [15]:

repository_data

[{'Topic': 'machine learning',
  'Repository_Name': 'mit-deep-learning-book-pdf',
  'Owner': 'janishar',
  'Description': 'MIT Deep Learning Book in PDF format (complete and parts) by Ian Goodfellow, Yoshua Bengio and Aaron Courville',
  'URL': 'https://github.com/janishar/mit-deep-learning-book-pdf',
  'Programming_Language': 'Java',
  'Creation_Date': '2017-04-07T10:46:50Z',
  'Last_Updated_Date': '2024-10-06T04:30:47Z',
  'Number_of_Stars': 12783,
  'Number_of_Forks': 2699,
  'Number_of_Open_Issues': 12,
  'License_Type': 'Unknown'},
 {'Topic': 'machine learning',
  'Repository_Name': 'machine-learning-mindmap',
  'Owner': 'dformoso',
  'Description': 'A mindmap summarising Machine Learning concepts, from Data Analysis to Deep Learning.',
  'URL': 'https://github.com/dformoso/machine-learning-mindmap',
  'Programming_Language': None,
  'Creation_Date': '2017-08-10T04:29:24Z',
  'Last_Updated_Date': '2024-10-05T15:14:52Z',
  'Number_of_Stars': 6114,
  'Number_of_Forks': 1005,
  'Numb

## DataFrame Conversion 

In [16]:
repo_df = pd.DataFrame(repository_data)
repo_df

Unnamed: 0,Topic,Repository_Name,Owner,Description,URL,Programming_Language,Creation_Date,Last_Updated_Date,Number_of_Stars,Number_of_Forks,Number_of_Open_Issues,License_Type
0,machine learning,mit-deep-learning-book-pdf,janishar,MIT Deep Learning Book in PDF format (complete...,https://github.com/janishar/mit-deep-learning-...,Java,2017-04-07T10:46:50Z,2024-10-06T04:30:47Z,12783,2699,12,Unknown
1,machine learning,machine-learning-mindmap,dformoso,A mindmap summarising Machine Learning concept...,https://github.com/dformoso/machine-learning-m...,,2017-08-10T04:29:24Z,2024-10-05T15:14:52Z,6114,1005,4,Apache License 2.0
2,machine learning,rapping-neural-network,robbiebarrat,Rap song writing recurrent neural network trai...,https://github.com/robbiebarrat/rapping-neural...,Python,2016-11-03T22:39:49Z,2024-10-02T09:01:24Z,1043,167,14,Unknown
3,machine learning,awesome-machine-learning,onmyway133,🎰 A curated list of machine learning resources...,https://github.com/onmyway133/awesome-machine-...,,2017-06-10T16:05:45Z,2024-10-02T04:41:22Z,807,106,2,MIT License
4,machine learning,DeepJ,calclavia,A deep learning model for style-specific music...,https://github.com/calclavia/DeepJ,Python,2017-01-15T06:43:17Z,2024-09-25T05:00:44Z,725,110,16,MIT License
5,machine learning,HungaBunga,ypeleg,HungaBunga: Brute-Force all sklearn models wit...,https://github.com/ypeleg/HungaBunga,Python,2019-08-20T11:26:09Z,2024-09-11T03:23:32Z,710,79,14,MIT License
6,machine learning,practical-mlops-book,paiml,[Book-2021] Practical MLOps O'Reilly Book,https://github.com/paiml/practical-mlops-book,Jupyter Notebook,2020-11-08T13:30:47Z,2024-10-02T19:37:31Z,706,284,2,Unknown
7,machine learning,sklearn-classification,dformoso,Data Science Notebook on a Classification Task...,https://github.com/dformoso/sklearn-classifica...,Jupyter Notebook,2017-08-12T05:05:33Z,2024-10-05T04:34:20Z,690,232,7,GNU General Public License v3.0
8,machine learning,neptune-client,neptune-ai,📘 The experiment tracker for foundation model ...,https://github.com/neptune-ai/neptune-client,Python,2019-02-11T11:25:57Z,2024-10-05T12:04:01Z,576,63,30,Apache License 2.0
9,machine learning,moviebox,klaudiosinani,Machine learning movie recommending system,https://github.com/klaudiosinani/moviebox,Python,2018-01-23T20:37:19Z,2024-09-23T14:20:54Z,524,55,4,MIT License


## For every Topics

In [18]:
repository_data = []
for topic in trending_topics:
    data = fetch_repository_data(topic)
    repository_data.extend(data)

In [19]:
repository_data

[{'Topic': 'machine learning',
  'Repository_Name': 'mit-deep-learning-book-pdf',
  'Owner': 'janishar',
  'Description': 'MIT Deep Learning Book in PDF format (complete and parts) by Ian Goodfellow, Yoshua Bengio and Aaron Courville',
  'URL': 'https://github.com/janishar/mit-deep-learning-book-pdf',
  'Programming_Language': 'Java',
  'Creation_Date': '2017-04-07T10:46:50Z',
  'Last_Updated_Date': '2024-10-06T04:30:47Z',
  'Number_of_Stars': 12783,
  'Number_of_Forks': 2699,
  'Number_of_Open_Issues': 12,
  'License_Type': 'Unknown'},
 {'Topic': 'machine learning',
  'Repository_Name': 'machine-learning-mindmap',
  'Owner': 'dformoso',
  'Description': 'A mindmap summarising Machine Learning concepts, from Data Analysis to Deep Learning.',
  'URL': 'https://github.com/dformoso/machine-learning-mindmap',
  'Programming_Language': None,
  'Creation_Date': '2017-08-10T04:29:24Z',
  'Last_Updated_Date': '2024-10-05T15:14:52Z',
  'Number_of_Stars': 6114,
  'Number_of_Forks': 1005,
  'Numb

In [20]:
repo_df = pd.DataFrame(repository_data)
repo_df

Unnamed: 0,Topic,Repository_Name,Owner,Description,URL,Programming_Language,Creation_Date,Last_Updated_Date,Number_of_Stars,Number_of_Forks,Number_of_Open_Issues,License_Type
0,machine learning,mit-deep-learning-book-pdf,janishar,MIT Deep Learning Book in PDF format (complete...,https://github.com/janishar/mit-deep-learning-...,Java,2017-04-07T10:46:50Z,2024-10-06T04:30:47Z,12783,2699,12,Unknown
1,machine learning,machine-learning-mindmap,dformoso,A mindmap summarising Machine Learning concept...,https://github.com/dformoso/machine-learning-m...,,2017-08-10T04:29:24Z,2024-10-05T15:14:52Z,6114,1005,4,Apache License 2.0
2,machine learning,rapping-neural-network,robbiebarrat,Rap song writing recurrent neural network trai...,https://github.com/robbiebarrat/rapping-neural...,Python,2016-11-03T22:39:49Z,2024-10-02T09:01:24Z,1043,167,14,Unknown
3,machine learning,awesome-machine-learning,onmyway133,🎰 A curated list of machine learning resources...,https://github.com/onmyway133/awesome-machine-...,,2017-06-10T16:05:45Z,2024-10-02T04:41:22Z,807,106,2,MIT License
4,machine learning,DeepJ,calclavia,A deep learning model for style-specific music...,https://github.com/calclavia/DeepJ,Python,2017-01-15T06:43:17Z,2024-09-25T05:00:44Z,725,110,16,MIT License
...,...,...,...,...,...,...,...,...,...,...,...,...
876,big data,FacebookGlobalCities,riquedev,"Obtenha ID, Nome, Latitude, Longitude de deter...",https://github.com/riquedev/FacebookGlobalCities,PHP,2017-08-12T11:42:47Z,2017-08-12T12:50:13Z,0,0,0,MIT License
877,big data,NOAA_GHCND,glider4,Conversion and ingestion of NOAA GHCN-D weathe...,https://github.com/glider4/NOAA_GHCND,Python,2020-02-15T03:44:41Z,2021-02-01T02:07:24Z,0,1,0,GNU General Public License v3.0
878,big data,DSA_leetcode,tinyHiker,This directory hold my work on data structure...,https://github.com/tinyHiker/DSA_leetcode,Python,2024-01-24T23:21:25Z,2024-01-25T00:42:23Z,0,0,0,Unknown
879,big data,Search-engine---English-Wikipedia,noama11,Search engine for Wikipedia's 6.3M+ documents....,https://github.com/noama11/Search-engine---Eng...,Python,2024-02-23T09:05:18Z,2024-08-17T17:08:29Z,0,0,0,Unknown


In [21]:
# Function to fetch repository data
def fetch_repository_data(topic):
    params = {
        "q": f"topic:{topic}",
        "sort": "stars",
        "per_page": 100
    }

    response = requests.get(api_url, params=params)
    data = response.json()["items"]

    repository_data = []
    for item in data:
        repository_data.append({
            "Topic":topic,
            "Repository_Name": item["name"],
            "Owner": item["owner"]["login"],
            "Description": item["description"],
            "URL": item["html_url"],
            "Programming_Language": item["language"],
            "Creation_Date": item["created_at"],
            "Last_Updated_Date": item["updated_at"],
            "Number_of_Stars": item["stargazers_count"],
            "Number_of_Forks": item["forks_count"],
            "Number_of_Open_Issues": item["open_issues_count"],
            "License_Type": item["license"]["name"] if item["license"] else "Unknown"
        })

    return repository_data

repository_data = []
for topic in trending_topics:
    data = fetch_repository_data(topic)
    repository_data.extend(data)


repo_df = pd.DataFrame(repository_data)

In [22]:
repo_df

Unnamed: 0,Topic,Repository_Name,Owner,Description,URL,Programming_Language,Creation_Date,Last_Updated_Date,Number_of_Stars,Number_of_Forks,Number_of_Open_Issues,License_Type
0,machine learning,mit-deep-learning-book-pdf,janishar,MIT Deep Learning Book in PDF format (complete...,https://github.com/janishar/mit-deep-learning-...,Java,2017-04-07T10:46:50Z,2024-10-06T04:30:47Z,12783,2699,12,Unknown
1,machine learning,machine-learning-mindmap,dformoso,A mindmap summarising Machine Learning concept...,https://github.com/dformoso/machine-learning-m...,,2017-08-10T04:29:24Z,2024-10-05T15:14:52Z,6114,1005,4,Apache License 2.0
2,machine learning,rapping-neural-network,robbiebarrat,Rap song writing recurrent neural network trai...,https://github.com/robbiebarrat/rapping-neural...,Python,2016-11-03T22:39:49Z,2024-10-02T09:01:24Z,1043,167,14,Unknown
3,machine learning,awesome-machine-learning,onmyway133,🎰 A curated list of machine learning resources...,https://github.com/onmyway133/awesome-machine-...,,2017-06-10T16:05:45Z,2024-10-02T04:41:22Z,807,106,2,MIT License
4,machine learning,DeepJ,calclavia,A deep learning model for style-specific music...,https://github.com/calclavia/DeepJ,Python,2017-01-15T06:43:17Z,2024-09-25T05:00:44Z,725,110,16,MIT License
...,...,...,...,...,...,...,...,...,...,...,...,...
876,big data,FacebookGlobalCities,riquedev,"Obtenha ID, Nome, Latitude, Longitude de deter...",https://github.com/riquedev/FacebookGlobalCities,PHP,2017-08-12T11:42:47Z,2017-08-12T12:50:13Z,0,0,0,MIT License
877,big data,NOAA_GHCND,glider4,Conversion and ingestion of NOAA GHCN-D weathe...,https://github.com/glider4/NOAA_GHCND,Python,2020-02-15T03:44:41Z,2021-02-01T02:07:24Z,0,1,0,GNU General Public License v3.0
878,big data,DSA_leetcode,tinyHiker,This directory hold my work on data structure...,https://github.com/tinyHiker/DSA_leetcode,Python,2024-01-24T23:21:25Z,2024-01-25T00:42:23Z,0,0,0,Unknown
879,big data,Search-engine---English-Wikipedia,noama11,Search engine for Wikipedia's 6.3M+ documents....,https://github.com/noama11/Search-engine---Eng...,Python,2024-02-23T09:05:18Z,2024-08-17T17:08:29Z,0,0,0,Unknown


In [24]:
repo_df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 881 entries, 0 to 880
Data columns (total 12 columns):
 #   Column                 Non-Null Count  Dtype 
---  ------                 --------------  ----- 
 0   Topic                  881 non-null    object
 1   Repository_Name        881 non-null    object
 2   Owner                  881 non-null    object
 3   Description            866 non-null    object
 4   URL                    881 non-null    object
 5   Programming_Language   783 non-null    object
 6   Creation_Date          881 non-null    object
 7   Last_Updated_Date      881 non-null    object
 8   Number_of_Stars        881 non-null    int64 
 9   Number_of_Forks        881 non-null    int64 
 10  Number_of_Open_Issues  881 non-null    int64 
 11  License_Type           881 non-null    object
dtypes: int64(3), object(9)
memory usage: 82.7+ KB


In [27]:
# Find rows where 'Description' column has NaN values
null_rows = repo_df[repo_df['Description'].isnull()]

# Display the rows with null values in the 'Description' column
print(null_rows)


                           Topic  \
58              machine learning   
77              machine learning   
143           data visualization   
186           data visualization   
267                deep learning   
280                deep learning   
294                deep learning   
296                deep learning   
322  natural language processing   
328  natural language processing   
420             data engineering   
856                     big data   
859                     big data   
865                     big data   
875                     big data   

                                  Repository_Name             Owner  \
58                          Credit-Risk-Modelling        RegaipKURT   
77                                    algorithmia    snlpatel001213   
143                                    HistoryMap         Vis4Sense   
186                      Python-for-data-analysis       buomsoo-kim   
267                           DeepAndCrossNetwork           barkain 

In [26]:
# Count the number of null rows in the 'Description' column
null_count = repo_df['Description'].isnull().sum()
null_count


15

# Data Cleaning:

In [35]:

# 1. Fill Missing Values
# 'Programming Language' might have missing values, fill with 'Unknown'
repo_df['Programming_Language'].fillna('Unknown', inplace=True)

# 'License Type' might be missing if no license is provided, fill with 'None'
repo_df['License_Type'].fillna('None', inplace=True)

# 'Description' might be missing if no Description is provided, fill with 'None'
repo_df['Description'].fillna('None', inplace=True)

# 2. Convert Dates to datetime format
repo_df['Creation_Date'] = pd.to_datetime(repo_df['Creation_Date']).dt.date
repo_df['Last_Updated_Date'] = pd.to_datetime(repo_df['Last_Updated_Date']).dt.date

# 3. Handle Duplicates (if any)
# Ensure that repositories are unique based on the repository name and owner
repo_df.drop_duplicates(subset=['Repository_Name', 'Owner'], inplace=True)

# 4. Ensure Data Consistency (Standardizing formats)
# Convert all text fields to lowercase for consistency
repo_df['Repository_Name'] = repo_df['Repository_Name'].str.lower()
repo_df['Owner'] = repo_df['Owner'].str.lower()
repo_df['Programming_Language'] = repo_df['Programming_Language'].str.lower()
repo_df['License_Type'] = repo_df['License_Type'].str.lower()

# 5. Change index name to 'ID' and start from 1
repo_df.index = repo_df.index + 1 
repo_df.index.name = 'ID'  


repo_df


The behavior will change in pandas 3.0. This inplace method will never work because the intermediate object on which we are setting values always behaves as a copy.

For example, when doing 'df[col].method(value, inplace=True)', try using 'df.method({col: value}, inplace=True)' or df[col] = df[col].method(value) instead, to perform the operation inplace on the original object.


  repo_df['Programming_Language'].fillna('Unknown', inplace=True)
The behavior will change in pandas 3.0. This inplace method will never work because the intermediate object on which we are setting values always behaves as a copy.

For example, when doing 'df[col].method(value, inplace=True)', try using 'df.method({col: value}, inplace=True)' or df[col] = df[col].method(value) instead, to perform the operation inplace on the original object.


  repo_df['License_Type'].fillna('None', inplace=True)
The behavior will change in pandas 3.0. This inplace method will never work because the intermediate object on whic

Unnamed: 0_level_0,Topic,Repository_Name,Owner,Description,URL,Programming_Language,Creation_Date,Last_Updated_Date,Number_of_Stars,Number_of_Forks,Number_of_Open_Issues,License_Type
ID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
1,machine learning,mit-deep-learning-book-pdf,janishar,MIT Deep Learning Book in PDF format (complete...,https://github.com/janishar/mit-deep-learning-...,java,2017-04-07,2024-10-06,12783,2699,12,unknown
2,machine learning,machine-learning-mindmap,dformoso,A mindmap summarising Machine Learning concept...,https://github.com/dformoso/machine-learning-m...,unknown,2017-08-10,2024-10-05,6114,1005,4,apache license 2.0
3,machine learning,rapping-neural-network,robbiebarrat,Rap song writing recurrent neural network trai...,https://github.com/robbiebarrat/rapping-neural...,python,2016-11-03,2024-10-02,1043,167,14,unknown
4,machine learning,awesome-machine-learning,onmyway133,🎰 A curated list of machine learning resources...,https://github.com/onmyway133/awesome-machine-...,unknown,2017-06-10,2024-10-02,807,106,2,mit license
5,machine learning,deepj,calclavia,A deep learning model for style-specific music...,https://github.com/calclavia/DeepJ,python,2017-01-15,2024-09-25,725,110,16,mit license
...,...,...,...,...,...,...,...,...,...,...,...,...
877,big data,facebookglobalcities,riquedev,"Obtenha ID, Nome, Latitude, Longitude de deter...",https://github.com/riquedev/FacebookGlobalCities,php,2017-08-12,2017-08-12,0,0,0,mit license
878,big data,noaa_ghcnd,glider4,Conversion and ingestion of NOAA GHCN-D weathe...,https://github.com/glider4/NOAA_GHCND,python,2020-02-15,2021-02-01,0,1,0,gnu general public license v3.0
879,big data,dsa_leetcode,tinyhiker,This directory hold my work on data structure...,https://github.com/tinyHiker/DSA_leetcode,python,2024-01-24,2024-01-25,0,0,0,unknown
880,big data,search-engine---english-wikipedia,noama11,Search engine for Wikipedia's 6.3M+ documents....,https://github.com/noama11/Search-engine---Eng...,python,2024-02-23,2024-08-17,0,0,0,unknown


In [37]:
repo_df.info()

<class 'pandas.core.frame.DataFrame'>
Index: 857 entries, 1 to 881
Data columns (total 12 columns):
 #   Column                 Non-Null Count  Dtype 
---  ------                 --------------  ----- 
 0   Topic                  857 non-null    object
 1   Repository_Name        857 non-null    object
 2   Owner                  857 non-null    object
 3   Description            857 non-null    object
 4   URL                    857 non-null    object
 5   Programming_Language   857 non-null    object
 6   Creation_Date          857 non-null    object
 7   Last_Updated_Date      857 non-null    object
 8   Number_of_Stars        857 non-null    int64 
 9   Number_of_Forks        857 non-null    int64 
 10  Number_of_Open_Issues  857 non-null    int64 
 11  License_Type           857 non-null    object
dtypes: int64(3), object(9)
memory usage: 87.0+ KB


# Data Storage

In [38]:
from sqlalchemy import create_engine

In [62]:

# Replace with your PostgreSQL database connection details
# Format: 'postgresql+psycopg2://username:password@host:port/db_name'
username='postgres'
password='Ajay'

engine = create_engine('postgresql+psycopg2://postgres:Ajay@localhost:5432/github_data')
#con=engine.connect


# Save the DataFrame to the PostgreSQL database, overwrites the table if it exists
repo_df.to_sql('repositories', con=engine, if_exists='replace', index=False)



857

# Data Retrival

In [63]:
engine = create_engine('postgresql+psycopg2://postgres:Ajay@localhost:5432/github_data')

# Load data from the PostgreSQL database
def load_data():
    query = "SELECT * FROM public.repositories;"
    df = pd.read_sql(query, engine)
    return df


In [64]:
data=load_data()
data

Unnamed: 0,Topic,Repository_Name,Owner,Description,URL,Programming_Language,Creation_Date,Last_Updated_Date,Number_of_Stars,Number_of_Forks,Number_of_Open_Issues,License_Type
0,machine learning,mit-deep-learning-book-pdf,janishar,MIT Deep Learning Book in PDF format (complete...,https://github.com/janishar/mit-deep-learning-...,java,2017-04-07,2024-10-06,12783,2699,12,unknown
1,machine learning,machine-learning-mindmap,dformoso,A mindmap summarising Machine Learning concept...,https://github.com/dformoso/machine-learning-m...,unknown,2017-08-10,2024-10-05,6114,1005,4,apache license 2.0
2,machine learning,rapping-neural-network,robbiebarrat,Rap song writing recurrent neural network trai...,https://github.com/robbiebarrat/rapping-neural...,python,2016-11-03,2024-10-02,1043,167,14,unknown
3,machine learning,awesome-machine-learning,onmyway133,🎰 A curated list of machine learning resources...,https://github.com/onmyway133/awesome-machine-...,unknown,2017-06-10,2024-10-02,807,106,2,mit license
4,machine learning,deepj,calclavia,A deep learning model for style-specific music...,https://github.com/calclavia/DeepJ,python,2017-01-15,2024-09-25,725,110,16,mit license
...,...,...,...,...,...,...,...,...,...,...,...,...
852,big data,facebookglobalcities,riquedev,"Obtenha ID, Nome, Latitude, Longitude de deter...",https://github.com/riquedev/FacebookGlobalCities,php,2017-08-12,2017-08-12,0,0,0,mit license
853,big data,noaa_ghcnd,glider4,Conversion and ingestion of NOAA GHCN-D weathe...,https://github.com/glider4/NOAA_GHCND,python,2020-02-15,2021-02-01,0,1,0,gnu general public license v3.0
854,big data,dsa_leetcode,tinyhiker,This directory hold my work on data structure...,https://github.com/tinyHiker/DSA_leetcode,python,2024-01-24,2024-01-25,0,0,0,unknown
855,big data,search-engine---english-wikipedia,noama11,Search engine for Wikipedia's 6.3M+ documents....,https://github.com/noama11/Search-engine---Eng...,python,2024-02-23,2024-08-17,0,0,0,unknown


In [66]:
pip freeze > requirments.txt

Note: you may need to restart the kernel to use updated packages.


