# Part 1: Using wget

In [None]:
# download the data from a URL
# source: https://archive.ics.uci.edu/ml/datasets/Arrhythmia
# alternate URL: https://lazyprogrammer.me/course_files/arrhythmia.data
#!wget --no-check-certificate https://archive.ics.uci.edu/ml/machine-learning-databases/arrhythmia/arrhythmia.data
!wget https://lazyprogrammer.me/course_files/arrhythmia.data

In [None]:
# list files in the current directory (arrhythmia.data should appear once the download above has finished)
!ls

In [None]:
# print the first lines of the raw file to check whether the data has a header row
!head arrhythmia.data

In [None]:
# read the downloaded file into a DataFrame
# header=None: treat the first line as data rather than as column names,
# so the columns are labelled with integers starting at 0
import pandas as pd
df = pd.read_csv(filepath_or_buffer='arrhythmia.data', header=None)

In [None]:
# the data has many columns, so keep just the first six and give them
# readable names (as per the dataset documentation)
first_six = list(range(6))
readable_names = ['age', 'sex', 'height', 'weight', 'QRS duration', 'P-R interval']
data = df[first_six].rename(columns=dict(zip(first_six, readable_names)))

In [None]:
import matplotlib.pyplot as plt
# enlarge the default figure size so the subplots don't overlap
plt.rc('figure', figsize=[15, 15])
# one histogram per column; the trailing semicolon suppresses the return value in the cell output
data.hist();

In [None]:
# draw a matrix of scatter plots for the selected columns
# (trailing semicolon suppresses the return value, as with the histograms)
from pandas.plotting import scatter_matrix
scatter_matrix(frame=data);

# Part 2: Using tf.keras

In [None]:
# use keras get_file to download the auto MPG dataset
# source: https://archive.ics.uci.edu/ml/datasets/Auto+MPG
# original UCI location, kept commented out for reference:
#url = 'https://archive.ics.uci.edu/ml/machine-learning-databases/auto-mpg/auto-mpg.data'

# alternate URL (a copy hosted on GitHub) - this is the value `url` is actually set to
url = 'https://raw.githubusercontent.com/lazyprogrammer/machine_learning_examples/master/tf2.0/auto-mpg.data'


In [None]:
# import TensorFlow in this cell so it does not depend on an import made elsewhere;
# without it, `tf` is undefined on a fresh kernel and the call below raises NameError
import tensorflow as tf

# download `url` and store it under the file name 'auto-mpg.data';
# the value returned by get_file is displayed as the cell output
# check out the documentation for other arguments
tf.keras.utils.get_file('auto-mpg.data', url)

In [None]:
!head /root/.keras/datasets/auto-mpg.data

In [None]:
# unless you specify an alternative path, the data will go into ~/.keras/datasets/
# (that is /root/.keras/datasets/ when running as root)
import os
auto_mpg_path = os.path.expanduser('~/.keras/datasets/auto-mpg.data')
# header=None: the first line is data, not column names
# sep=r'\s+' splits on runs of whitespace; it replaces the deprecated
# delim_whitespace=True and parses the file the same way
df = pd.read_csv(auto_mpg_path, header=None, sep=r'\s+')
df.head()

# Part 3: Upload the file yourself

In [None]:
# ask the user to upload file(s) from their own machine through Colab
# NOTE(review): `uploaded` presumably maps each file name to its contents - confirm against the Colab docs
from google.colab import files
uploaded = files.upload()

In [None]:
# display what files.upload() returned
# NOTE(review): if this holds the raw file contents, the output can be very large - consider showing only the file names
uploaded

In [None]:
# the file is uploaded to the current directory, so it should show up in this listing
!ls

In [None]:
# open the uploaded file
# the last few lines are junk, so malformed lines are dropped instead of aborting the parse
# on_bad_lines='warn' (pandas >= 1.3) replaces error_bad_lines=False, which was removed
# in pandas 2.0 and now raises TypeError; each dropped line is reported with a warning
df = pd.read_csv('daily-minimum-temperatures-in-me.csv', on_bad_lines='warn')
df.head()

In [None]:
# upload a Python file with some useful functions (meant for fake_util.py)
# the file has to be named fake_util.py for the `from fake_util import ...` in the next cell to find it
from google.colab import files
uploaded = files.upload()

In [None]:
# import a function from the uploaded fake_util.py and call it
from fake_util import my_useful_function
my_useful_function()

In [None]:
# print the current working directory
!pwd

# Part 4: Access files from Google Drive

In [None]:
# Access files from your Google Drive
# mounts the Drive at /content/gdrive
# NOTE(review): presumably this prompts for authorization the first time it runs - confirm
from google.colab import drive
drive.mount('/content/gdrive')

In [None]:
# Check current directory - now gdrive is there
# (assumes the working directory is /content, where the Drive was mounted - TODO confirm)
!ls

In [None]:
# What's in gdrive?
!ls gdrive

In [None]:
# Whoa! Look at all this great VIP content!
# lists the 'My Drive' folder under the mount point; the path is quoted because it contains a space
!ls '/content/gdrive/My Drive/'