Downloading the datasets from Google Drive

In [1]:
"""
Download all project datasets from Google Drive into data_input/.
"""

import os
from pathlib import Path
import gdown

# Destination folder for the downloaded files. The path is relative, so it is
# resolved against the current working directory. Create it (and any missing
# parent folders) up front; an already-existing folder is left as is.
DATA_DIR = Path("..", "..", "data_input")
DATA_DIR.mkdir(exist_ok=True, parents=True)

# Maps each local filename (as saved under DATA_DIR) to the Google Drive file
# ID it is fetched from. Entries are downloaded in the order listed here.
FILE_IDS = {
    "cards.csv": "1O03lb4ZqqMwy3aPeZquAT_OU9ChNyIEM",
    "order_details.csv": "1u1vsiNpF6saIcG3iDN-R7AiYAFqf9uzq",
    "orders.csv": "161Rv1xsAevewSnTRFV-9q6FWokgr_-Xt",
    "profiles.csv": "1bOe2EaMQbrBZyINh9pLMPltDJ2BoNG_D",
    "reviews_labelled.csv": "1DRYj7r7VnlNyCSMrEHLbwWqj0fodBymV",
    "reviews.csv": "1kLhalVn5iczHSdp5o3I2PIWCqkOFfpuO",
    "users.csv": "1K2lycSQXUyMSBx0_NqfuljYzJbW6RzsF",
}

def download_file(file_id: str, filename: str) -> Path:
    """Download a single file from Google Drive into data_input/.

    Args:
        file_id: Google Drive file ID, interpolated into the ``uc?id=`` URL.
        filename: Name the file is saved under inside ``DATA_DIR``.

    Returns:
        The destination path, ``DATA_DIR / filename``.

    Raises:
        RuntimeError: If ``gdown.download`` returns ``None`` instead of an
            output path.
    """
    url = f"https://drive.google.com/uc?id={file_id}"
    out_path = DATA_DIR / filename
    print(f"Downloading {filename} ...")
    # NOTE(review): per the gdown docs, download() returns the output filename
    # on success; some releases report failure by returning None rather than
    # raising, so the result is checked explicitly instead of being ignored.
    result = gdown.download(url, str(out_path), quiet=False)
    if result is None:
        raise RuntimeError(
            f"Failed to download {filename} (Google Drive file ID: {file_id})"
        )
    return out_path

def main() -> None:
    """Download every dataset in FILE_IDS into data_input/.

    Prints a start banner, fetches each file via ``download_file``, then
    checks that every expected file is present before printing the success
    banner.

    Raises:
        RuntimeError: If any expected file is missing from ``DATA_DIR`` after
            the download loop.
    """
    print("📥 Starting dataset download from Google Drive...\n")
    for fname, fid in FILE_IDS.items():
        download_file(fid, fname)

    # Only claim success when every expected file is actually on disk.
    missing = [fname for fname in FILE_IDS if not (DATA_DIR / fname).is_file()]
    if missing:
        raise RuntimeError(
            "Download incomplete; missing from data_input/: " + ", ".join(missing)
        )
    print("\n✅ All files downloaded successfully to data_input/")


if __name__ == "__main__":
    main()


📥 Starting dataset download from Google Drive...

Downloading cards.csv ...


Downloading...
From: https://drive.google.com/uc?id=1O03lb4ZqqMwy3aPeZquAT_OU9ChNyIEM
To: c:\Users\Admin\Desktop\DATA SCIENCE\Semester 2\Marketing Analytics\data_input\cards.csv
100%|██████████| 44.1M/44.1M [00:02<00:00, 17.5MB/s]


Downloading order_details.csv ...


Downloading...
From (original): https://drive.google.com/uc?id=1u1vsiNpF6saIcG3iDN-R7AiYAFqf9uzq
From (redirected): https://drive.google.com/uc?id=1u1vsiNpF6saIcG3iDN-R7AiYAFqf9uzq&confirm=t&uuid=1ba096e9-a79a-42d5-ae78-d22127633d43
To: c:\Users\Admin\Desktop\DATA SCIENCE\Semester 2\Marketing Analytics\data_input\order_details.csv
100%|██████████| 239M/239M [00:12<00:00, 18.5MB/s]


Downloading orders.csv ...


Downloading...
From (original): https://drive.google.com/uc?id=161Rv1xsAevewSnTRFV-9q6FWokgr_-Xt
From (redirected): https://drive.google.com/uc?id=161Rv1xsAevewSnTRFV-9q6FWokgr_-Xt&confirm=t&uuid=921289d1-60f8-45d5-85b1-a490bafcba31
To: c:\Users\Admin\Desktop\DATA SCIENCE\Semester 2\Marketing Analytics\data_input\orders.csv
100%|██████████| 250M/250M [00:13<00:00, 18.1MB/s]


Downloading profiles.csv ...


Downloading...
From: https://drive.google.com/uc?id=1bOe2EaMQbrBZyINh9pLMPltDJ2BoNG_D
To: c:\Users\Admin\Desktop\DATA SCIENCE\Semester 2\Marketing Analytics\data_input\profiles.csv
100%|██████████| 21.4M/21.4M [00:01<00:00, 20.3MB/s]


Downloading reviews_labelled.csv ...


Downloading...
From (original): https://drive.google.com/uc?id=1DRYj7r7VnlNyCSMrEHLbwWqj0fodBymV
From (redirected): https://drive.google.com/uc?id=1DRYj7r7VnlNyCSMrEHLbwWqj0fodBymV&confirm=t&uuid=32d2b54e-38cb-4975-8118-ae5603b7f72e
To: c:\Users\Admin\Desktop\DATA SCIENCE\Semester 2\Marketing Analytics\data_input\reviews_labelled.csv
100%|██████████| 212M/212M [00:11<00:00, 18.4MB/s]


Downloading reviews.csv ...


Downloading...
From: https://drive.google.com/uc?id=1kLhalVn5iczHSdp5o3I2PIWCqkOFfpuO
To: c:\Users\Admin\Desktop\DATA SCIENCE\Semester 2\Marketing Analytics\data_input\reviews.csv
100%|██████████| 51.0M/51.0M [00:02<00:00, 19.8MB/s]


Downloading users.csv ...


Downloading...
From: https://drive.google.com/uc?id=1K2lycSQXUyMSBx0_NqfuljYzJbW6RzsF
To: c:\Users\Admin\Desktop\DATA SCIENCE\Semester 2\Marketing Analytics\data_input\users.csv
100%|██████████| 69.2M/69.2M [00:03<00:00, 19.7MB/s]


✅ All files downloaded successfully to data_input/



