# Reading & visualizing raw data, cropping, filtering, and saving

## Import the few packages we'll need

In [1]:
import matplotlib
import pathlib
import mne

Ensure Matplotlib uses the `Qt5Agg` backend, which is the best choice for MNE-Python's interactive plotting functions.

In [2]:
# Select the Qt5Agg backend for the Matplotlib figures created in this notebook.
matplotlib.use('Qt5Agg')

Retrieve the storage location of the `sample` data, and download the dataset if it cannot be found.

In [3]:
# Look up where the `sample` dataset lives and wrap that location in a
# pathlib.Path right away, so sub-paths can be built with the `/` operator.
sample_data_dir = pathlib.Path(mne.datasets.sample.data_path())
sample_data_dir

Using default location ~/mne_data for sample...
Creating ~/mne_data


Downloading file 'MNE-sample-data-processed.tar.gz' from 'https://osf.io/86qa2/download?version=6' to 'C:\Users\eraym\mne_data'.
100%|######################################| 1.65G/1.65G [00:00<00:00, 830GB/s]
Untarring contents of 'C:\Users\eraym\mne_data\MNE-sample-data-processed.tar.gz' to 'C:\Users\eraym\mne_data'


WindowsPath('C:/Users/eraym/mne_data/MNE-sample-data')

## Load some raw data!

In [4]:
# Path of the raw recording inside the sample dataset.
raw_path = sample_data_dir.joinpath('MEG', 'sample', 'sample_audvis_raw.fif')

# Open the recording and display its summary as the cell output.
raw = mne.io.read_raw(raw_path)
raw

Opening raw data file C:\Users\eraym\mne_data\MNE-sample-data\MEG\sample\sample_audvis_raw.fif...
    Read a total of 3 projection items:
        PCA-v1 (1 x 102)  idle
        PCA-v2 (1 x 102)  idle
        PCA-v3 (1 x 102)  idle
    Range : 25800 ... 192599 =     42.956 ...   320.670 secs
Ready.


0,1
Measurement date,"December 03, 2002 19:01:10 GMT"
Experimenter,MEG
Digitized points,146 points
Good channels,"204 Gradiometers, 102 Magnetometers, 9 Stimulus, 60 EEG, 1 EOG"
Bad channels,"MEG 2443, EEG 053"
EOG channels,EOG 061
ECG channels,Not available
Sampling frequency,600.61 Hz
Highpass,0.10 Hz
Lowpass,172.18 Hz


## Let's visualize the raw data!

In [5]:
# Open the data browser on the recording as loaded (no event markers yet).
raw.plot()

Using matplotlib as 2D backend.


<MNEBrowseFigure size 800x800 with 5 Axes>

## Extract events from the `STIM` channels

In [6]:
# Detect the events in the recording; MNE logs how many were found and
# which event IDs occur.
events = mne.find_events(raw)

320 events found
Event IDs: [ 1  2  3  4  5 32]


In [7]:
# Map a readable condition name to each integer event code.
event_id = dict([
    ('Auditory/Left', 1),
    ('Auditory/Right', 2),
    ('Visual/Left', 3),
    ('Visual/Right', 4),
    ('Smiley', 5),
    ('Button', 32),
])
event_id

{'Auditory/Left': 1,
 'Auditory/Right': 2,
 'Visual/Left': 3,
 'Visual/Right': 4,
 'Smiley': 5,
 'Button': 32}

In [8]:
# Count the rows whose third column equals 32 (the 'Button' code).
int((events[:, 2] == 32).sum())

16

<div class="alert alert-success">
    <b>EXERCISE</b>:
     <ul>
         <li>How many <strong>visual</strong> events are in the data?</li>
    </ul>
</div>

In [11]:
# Visual events carry code 3 ('Visual/Left') or 4 ('Visual/Right'); select
# both with one combined mask and count the matching rows.
len(events[(events[:, 2] == 3) | (events[:, 2] == 4)])

144

## Plot the raw data again, but add event markers

In [12]:
# Same browser as before, now with the detected events passed in together
# with their condition names.
raw.plot(events=events, event_id=event_id)

<MNEBrowseFigure size 800x800 with 5 Axes>

## Gather some info about the data

In [13]:
# Summary of the recording's metadata (channels, bads, sampling rate, filters).
raw.info

0,1
Measurement date,"December 03, 2002 19:01:10 GMT"
Experimenter,MEG
Digitized points,146 points
Good channels,"204 Gradiometers, 102 Magnetometers, 9 Stimulus, 60 EEG, 1 EOG"
Bad channels,"MEG 2443, EEG 053"
EOG channels,EOG 061
ECG channels,Not available
Sampling frequency,600.61 Hz
Highpass,0.10 Hz
Lowpass,172.18 Hz


In [14]:
# Measurement date of the recording.
raw.info['meas_date']

datetime.datetime(2002, 12, 3, 19, 1, 10, 720100, tzinfo=datetime.timezone.utc)

In [15]:
# Sampling frequency of the recording, in Hz.
raw.info['sfreq']

600.614990234375

In [16]:
# Names of the channels currently marked as bad.
raw.info['bads']

['MEG 2443', 'EEG 053']

In [17]:
# Names of the first ten channels.
raw.ch_names[:10]

['MEG 0113',
 'MEG 0112',
 'MEG 0111',
 'MEG 0122',
 'MEG 0123',
 'MEG 0121',
 'MEG 0132',
 'MEG 0133',
 'MEG 0131',
 'MEG 0143']

In [18]:
# Full metadata record of the first channel.
raw.info['chs'][0]

{'scanno': 1,
 'logno': 113,
 'kind': 1 (FIFFV_MEG_CH),
 'range': 0.00030517578125,
 'cal': 3.1600000394149674e-09,
 'coil_type': 3012 (FIFFV_COIL_VV_PLANAR_T1),
 'loc': array([-0.1066    ,  0.0464    , -0.0604    , -0.0127    ,  0.0057    ,
        -0.99990302, -0.186801  , -0.98240298, -0.0033    , -0.98232698,
         0.18674099,  0.013541  ]),
 'unit': 201 (FIFF_UNIT_T_M),
 'unit_mul': 0 (FIFF_UNITM_NONE),
 'ch_name': 'MEG 0113',
 'coord_frame': 1 (FIFFV_COORD_DEVICE)}

## Visualize the sensor locations

In [19]:
# Plot the positions of the EEG sensors (default view).
raw.plot_sensors(ch_type='eeg')

<Figure size 640x640 with 1 Axes>

In [20]:
# Plot the EEG sensor positions again, this time as a 3D view.
raw.plot_sensors(kind='3d', ch_type='eeg')

<Figure size 640x640 with 1 Axes>

## Mark channels as bad

Mark an additional EEG channel as bad and view the topoplot.

In [21]:
# Bad-channel list before adding another entry.
raw.info['bads']

['MEG 2443', 'EEG 053']

In [22]:
# Flag one more EEG channel as bad. The membership check keeps this cell
# idempotent: re-running it does not append a duplicate 'EEG 051' entry.
if 'EEG 051' not in raw.info['bads']:
    raw.info['bads'] += ['EEG 051']

# Re-draw the EEG sensor plot with the updated bad-channel list.
raw.plot_sensors(ch_type='eeg')

<Figure size 640x640 with 1 Axes>

## Select only a subset of the channels

In [23]:
# Work on a copy so `raw` keeps every channel, then narrow the copy down to
# the EEG and EOG channels. exclude=[] keeps the channels marked as bad.
raw_eeg = raw.copy()
raw_eeg.pick_types(meg=False, eeg=True, eog=True, exclude=[])

# Number of channels left after the selection.
len(raw_eeg.ch_names)

Removing projector <Projection | PCA-v1, active : False, n_channels : 102>
Removing projector <Projection | PCA-v2, active : False, n_channels : 102>
Removing projector <Projection | PCA-v3, active : False, n_channels : 102>


61

In [24]:
# Metadata summary of the EEG/EOG-only selection.
raw_eeg.info

0,1
Measurement date,"December 03, 2002 19:01:10 GMT"
Experimenter,MEG
Digitized points,146 points
Good channels,"60 EEG, 1 EOG"
Bad channels,"EEG 053, EEG 051"
EOG channels,EOG 061
ECG channels,Not available
Sampling frequency,600.61 Hz
Highpass,0.10 Hz
Lowpass,172.18 Hz


In [25]:
# Browse the EEG/EOG-only selection together with the event markers.
raw_eeg.plot(events=events, event_id=event_id)

<MNEBrowseFigure size 800x800 with 4 Axes>

<div class="alert alert-success">
    <b>EXERCISE</b>:
     <ul>
         <li>Select only MEG channels ("meg")</li>
         <li>Select only magnetometer channels ("mag")</li>
    </ul>
</div>

In [26]:
# Exercise solution: keep only the MEG channels (gradiometers and
# magnetometers). The result is named for what it holds (MEG, not EEG).
# exclude=[] keeps the channels marked as bad in the selection.
raw_meg = raw.copy().pick_types(meg=True, eeg=False, eog=False, exclude=[])
raw_meg.info

0,1
Measurement date,"December 03, 2002 19:01:10 GMT"
Experimenter,MEG
Digitized points,146 points
Good channels,"204 Gradiometers, 102 Magnetometers"
Bad channels,MEG 2443
EOG channels,Not available
ECG channels,Not available
Sampling frequency,600.61 Hz
Highpass,0.10 Hz
Lowpass,172.18 Hz


In [27]:
# Exercise solution: keep only the magnetometer channels. The result is
# named for what it holds (magnetometers, not EEG).
raw_mag = raw.copy().pick_types(meg='mag', eeg=False, eog=False, exclude=[])
raw_mag.info

0,1
Measurement date,"December 03, 2002 19:01:10 GMT"
Experimenter,MEG
Digitized points,146 points
Good channels,102 Magnetometers
Bad channels,
EOG channels,Not available
ECG channels,Not available
Sampling frequency,600.61 Hz
Highpass,0.10 Hz
Lowpass,172.18 Hz


## Crop and filter the data

In [28]:
# Crop a copy of the EEG selection with tmax=100, leaving `raw_eeg` itself
# untouched.
raw_eeg_cropped = raw_eeg.copy().crop(tmax=100)
# Time stamp of the last remaining sample.
raw_eeg_cropped.times[-1]

99.99916914588277

In [32]:
# Read the cropped samples into memory before filtering.
raw_eeg_cropped.load_data()
# Filter a copy with a 0.1 Hz lower and a 40 Hz upper passband edge; the
# unfiltered `raw_eeg_cropped` is kept for comparison.
raw_eeg_cropped_filtered = raw_eeg_cropped.copy().filter(l_freq=0.1, h_freq=40)

Reading 0 ... 60061  =      0.000 ...    99.999 secs...
Filtering raw data in 1 contiguous segment
Setting up band-pass filter from 0.1 - 40 Hz

FIR filter parameters
---------------------
Designing a one-pass, zero-phase, non-causal bandpass filter:
- Windowed time-domain design (firwin) method
- Hamming window with 0.0194 passband ripple and 53 dB stopband attenuation
- Lower passband edge: 0.10
- Lower transition bandwidth: 0.10 Hz (-6 dB cutoff frequency: 0.05 Hz)
- Upper passband edge: 40.00 Hz
- Upper transition bandwidth: 10.00 Hz (-6 dB cutoff frequency: 45.00 Hz)
- Filter length: 19821 samples (33.001 sec)



[Parallel(n_jobs=1)]: Using backend SequentialBackend with 1 concurrent workers.
[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:    0.0s remaining:    0.0s
[Parallel(n_jobs=1)]: Done   2 out of   2 | elapsed:    0.0s remaining:    0.0s
[Parallel(n_jobs=1)]: Done   3 out of   3 | elapsed:    0.0s remaining:    0.0s
[Parallel(n_jobs=1)]: Done   4 out of   4 | elapsed:    0.0s remaining:    0.0s
[Parallel(n_jobs=1)]: Done  60 out of  60 | elapsed:    0.5s finished


In [33]:
# Open one browser for the unfiltered and one for the filtered data so the
# two can be compared.
raw_eeg_cropped.plot(events=events, event_id=event_id)
raw_eeg_cropped_filtered.plot(events=events, event_id=event_id)

<MNEBrowseFigure size 800x800 with 4 Axes>

In [None]:
import matplotlib.pyplot as plt

# Two stacked panels: unfiltered data on top, filtered data below.
fig, ax = plt.subplots(nrows=2)

for panel_ax, panel_raw, panel_title in [
    (ax[0], raw_eeg_cropped, 'PSD before filtering'),
    (ax[1], raw_eeg_cropped_filtered, 'PSD after filtering'),
]:
    # show=False defers drawing until the figure is fully assembled.
    panel_raw.plot_psd(ax=panel_ax, show=False)
    panel_ax.set_title(panel_title)

# Only the bottom panel gets an explicit x-axis label.
ax[1].set_xlabel('Frequency (Hz)')
fig.set_tight_layout(True)
plt.show()

Effective window size : 3.410 (s)


[Parallel(n_jobs=1)]: Using backend SequentialBackend with 1 concurrent workers.
[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:    0.0s remaining:    0.0s
[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:    0.0s finished


Effective window size : 3.410 (s)


[Parallel(n_jobs=1)]: Using backend SequentialBackend with 1 concurrent workers.
[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:    0.0s remaining:    0.0s
[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:    0.0s finished
  plt.show()


Channels marked as bad:
['MEG 2443', 'EEG 053']
Channels marked as bad:
['MEG 2443', 'EEG 053']
Channels marked as bad:
['EEG 053', 'EEG 051']
Channels marked as bad:
['EEG 053', 'EEG 051']


<div class="alert alert-success">
    <b>EXERCISE</b>:
     <ul>
         <li>Filter the raw data with a 1 Hz high-pass and a 30 Hz low-pass filter and plot the PSD.</li>
    </ul>
</div>

In [None]:
# Exercise solution: filter a copy of the cropped data with a 1 Hz lower and
# a 30 Hz upper passband edge.
raw_eeg_cropped_filtered2 = raw_eeg_cropped.copy().filter(l_freq=1, h_freq=30)

In [None]:
# Two stacked panels: unfiltered data on top, 1-30 Hz filtered data below.
fig, ax = plt.subplots(nrows=2)

for panel_ax, panel_raw, panel_title in [
    (ax[0], raw_eeg_cropped, 'PSD before filtering'),
    (ax[1], raw_eeg_cropped_filtered2, 'PSD after filtering'),
]:
    # show=False defers drawing until the figure is fully assembled.
    panel_raw.plot_psd(ax=panel_ax, show=False)
    panel_ax.set_title(panel_title)

# Only the bottom panel gets an explicit x-axis label.
ax[1].set_xlabel('Frequency (Hz)')
fig.set_tight_layout(True)
plt.show()

## Save the data

In [None]:
# Write the cropped, 0.1-40 Hz filtered EEG data to disk. Create the output
# directory first: saving into a directory that does not exist would fail.
out_dir = pathlib.Path('out_data')
out_dir.mkdir(parents=True, exist_ok=True)

# overwrite=True lets the cell be re-run without failing on an existing file.
raw_eeg_cropped_filtered.save(out_dir / 'eeg_cropped_filt_raw.fif',
                              overwrite=True)