In [26]:
import numpy as np
import pandas as pd

In [27]:
"""
Native Python dates and times
"""

from datetime import datetime

t = datetime(year=2021, month=10, day=28)
print(t)

# Build a date using the datetime type

2021-10-28 00:00:00


In [28]:
# Parse a date from a free-form, human-readable string

from dateutil import parser

date_text = "28th of October, 2021"
date = parser.parse(date_text)
print(date)

2021-10-28 00:00:00


In [29]:
# Show the day of the week for the parsed date.
# format() with a strftime pattern is equivalent to calling date.strftime().

format(date, '%A')

'Thursday'

In [31]:
"""
Types Arrays of Times: Numpy's datetime64
"""

# Create datetime64 using array()
date = np.array(['2021-10-27', '2021-10-28'], dtype=np.datetime64)
type(date[0])

# Use datetune64()
date = np.datetime64('2021-10-27')
print(date)

2021-10-27


In [34]:
# datetime64 values support vectorized arithmetic: adding an integer array
# to a single date yields one date per integer offset.

np.add(date, np.arange(12))

array(['2021-10-27', '2021-10-28', '2021-10-29', '2021-10-30',
       '2021-10-31', '2021-11-01', '2021-11-02', '2021-11-03',
       '2021-11-04', '2021-11-05', '2021-11-06', '2021-11-07'],
      dtype='datetime64[D]')

In [40]:
# Second-based datetime: the input string is specified down to the second,
# so the value carries second resolution (spelled out here as unit 's').

date = np.datetime64('2021-10-28 10:11:30', 's')
print(date)

2021-10-28T10:11:30


In [41]:
# Nanosecond-based datetime: the second argument ('ns') sets the time unit,
# so the printed value carries nine fractional-second digits.

date = np.datetime64('2021-10-28 10:11:30', 'ns')
print(date)

2021-10-28T10:11:30.000000000


In [47]:
"""
Dates and Times in Pandas
"""

# Parse a string date in pandas

date = pd.to_datetime("27th of October, 2021")
print(date)
print(type(date))

2021-10-27 00:00:00
<class 'pandas._libs.tslibs.timestamps.Timestamp'>


In [46]:
# Output the day of the week of the pandas Timestamp

weekday_name = date.strftime('%A')
print(weekday_name)

Wednesday


In [48]:
# NumPy-style vectorized operations
# pd.to_timedelta() interprets bare integers as nanoseconds by default, so the
# unit is given explicitly to step one day at a time.

date + pd.to_timedelta(np.arange(12), unit='D')

DatetimeIndex(['2021-10-27', '2021-10-28', '2021-10-29', '2021-10-30',
               '2021-10-31', '2021-11-01', '2021-11-02', '2021-11-03',
               '2021-11-04', '2021-11-05', '2021-11-06', '2021-11-07'],
              dtype='datetime64[ns]', freq=None)

In [53]:
"""
Pandas Time Series: Indexing by Time
"""

# Indexing by timestamps
ind = pd.DatetimeIndex(['2021-10-27', '2021-10-28', '2021-10-29', '2021-10-30',
                       '2021-10-31', '2021-11-01', '2021-11-02'])
print(ind)

ser = pd.Series([0, 1, 2, 3, 4, 5, 6], index=ind)
print(ser)

DatetimeIndex(['2021-10-27', '2021-10-28', '2021-10-29', '2021-10-30',
               '2021-10-31', '2021-11-01', '2021-11-02'],
              dtype='datetime64[ns]', freq=None)
2021-10-27    0
2021-10-28    1
2021-10-29    2
2021-10-30    3
2021-10-31    4
2021-11-01    5
2021-11-02    6
dtype: int64


In [56]:
# Indexing patterns on a time-indexed Series

# Slice between two date strings (both endpoints appear in the result)
print(ser.loc['2021-10-27':'2021-10-31'], '\n')

# Select every entry of a month by passing just the year and month
print(ser.loc['2021-11'])

2021-10-27    0
2021-10-28    1
2021-10-29    2
2021-10-30    3
2021-10-31    4
dtype: int64 

2021-11-01    5
2021-11-02    6
dtype: int64


In [60]:
"""
Pandas Time Series Data Structures
"""

# Timestamp and DatetimeIndex

dates = pd.to_datetime([datetime(2015, 7, 3),
                       "4th of July, 2015",
                       '2015-Jul-6',
                       '07-07-2015',
                       '20150708'])
print(dates)

DatetimeIndex(['2015-07-03', '2015-07-04', '2015-07-06', '2015-07-07',
               '2015-07-08'],
              dtype='datetime64[ns]', freq=None)


In [62]:
# DatetimeIndex -> PeriodIndex with to_period()
#
# Only the final expression of a cell is rendered, so the daily conversion is
# bound to a name (instead of being computed and thrown away) and the weekly
# conversion is left as the displayed result.

daily_periods = dates.to_period('D')
dates.to_period('W')

PeriodIndex(['2015-06-29/2015-07-05', '2015-06-29/2015-07-05',
             '2015-07-06/2015-07-12', '2015-07-06/2015-07-12',
             '2015-07-06/2015-07-12'],
            dtype='period[W-SUN]', freq='W-SUN')

In [63]:
# TimedeltaIndex: subtracting one date from a DatetimeIndex gives each
# entry's offset from that date.

first_date = dates[0]
dates - first_date

TimedeltaIndex(['0 days', '1 days', '3 days', '4 days', '5 days'], dtype='timedelta64[ns]', freq=None)

In [66]:
"""
Regular Sequences
"""

# pd.date_range(), default freq: day

pd.date_range('2021-10-27', '2021-10-31')

DatetimeIndex(['2021-10-27', '2021-10-28', '2021-10-29', '2021-10-30',
               '2021-10-31'],
              dtype='datetime64[ns]', freq='D')

In [67]:
# Use a start point and a number of periods instead of an end point

pd.date_range(start='2021-10-27', periods=5)

DatetimeIndex(['2021-10-27', '2021-10-28', '2021-10-29', '2021-10-30',
               '2021-10-31'],
              dtype='datetime64[ns]', freq='D')

In [69]:
# Change the frequency: 12 hourly timestamps starting at midnight.
# The lowercase 'h' alias is used because the uppercase 'H' spelling is
# deprecated in recent pandas releases.

hourly_index = pd.date_range('2021-10-27', periods=12, freq='h')
hourly_index

DatetimeIndex(['2021-10-27 00:00:00', '2021-10-27 01:00:00',
               '2021-10-27 02:00:00', '2021-10-27 03:00:00',
               '2021-10-27 04:00:00', '2021-10-27 05:00:00',
               '2021-10-27 06:00:00', '2021-10-27 07:00:00',
               '2021-10-27 08:00:00', '2021-10-27 09:00:00',
               '2021-10-27 10:00:00', '2021-10-27 11:00:00'],
              dtype='datetime64[ns]', freq='H')

In [70]:
# pd.period_range(): twelve consecutive monthly periods starting at 2021-10

pd.period_range(start='2021-10', periods=12, freq='M')

PeriodIndex(['2021-10', '2021-11', '2021-12', '2022-01', '2022-02', '2022-03',
             '2022-04', '2022-05', '2022-06', '2022-07', '2022-08', '2022-09'],
            dtype='period[M]', freq='M')

In [71]:
# pd.timedelta_range(): ten durations spaced one hour apart, starting at zero.
# The lowercase 'h' alias is used because the uppercase 'H' spelling is
# deprecated in recent pandas releases.

hourly_deltas = pd.timedelta_range(0, periods=10, freq='h')
hourly_deltas

TimedeltaIndex(['00:00:00', '01:00:00', '02:00:00', '03:00:00', '04:00:00',
                '05:00:00', '06:00:00', '07:00:00', '08:00:00', '09:00:00'],
               dtype='timedelta64[ns]', freq='H')