# 5. Optimal Top N

This notebook shows how to run the Optimal Top-N method (`OptimalTopNController`) on a ViMMS dataset.

In [1]:
# Render matplotlib figures inline, directly below the cell that creates them.
%matplotlib inline

In [2]:
# Load the autoreload extension and use mode 2: re-import all modules before
# each cell executes, so edits to library source files are picked up without
# restarting the kernel.
%load_ext autoreload
%autoreload 2

In [3]:
import sys

# Extend the module search path with the directory two levels above the
# notebook's working directory.
# NOTE(review): presumably the repository root, so that the `vimms` imports
# below resolve against the local checkout -- confirm.
extra_search_path = '../..'
sys.path.append(extra_search_path)

In [4]:
import copy
import os
from pathlib import Path

In [5]:
from vimms.MassSpec import IndependentMassSpectrometer
from vimms.Controller import OptimalTopNController
from vimms.Environment import Environment
from vimms.Common import *

from mass_spec_utils.data_import.mzmine import load_picked_boxes

### Load the data

In [6]:
# Fixtures live in tests/integration/fixtures, two levels above the current
# working directory.
fixture_subdir = ('..', '..', 'tests', 'integration', 'fixtures')
data_dir = os.path.abspath(os.path.join(os.getcwd(), *fixture_subdir))

# NOTE(review): load_obj presumably unpickles these files -- only load
# fixtures that come from a trusted checkout.
dataset_file = os.path.join(data_dir, 'QCB_22May19_1.p')
dataset = load_obj(dataset_file)

peak_sampler_file = Path(data_dir, 'peak_sampler_mz_rt_int_beerqcb_fragmentation.p')
ps = load_obj(peak_sampler_file)

In [7]:
# CSV of picked peak boxes for the same sample, stored next to the fixtures.
# The loader is given the path as a plain string.
box_file = str(Path(data_dir) / 'QCB_22May19_1_pp.csv')
boxes = load_picked_boxes(box_file)

### Run Controller

In [8]:
# Sanity check: show the types of the box file path and the loaded boxes,
# plus how many boxes were loaded.
(type(box_file), type(boxes), len(boxes))

(str, list, 3523)

In [9]:
# Retention-time window to simulate; the progress bar reports it in seconds.
min_rt, max_rt = 0, 1440
rt_range = [(min_rt, max_rt)]

# Controller settings, passed positionally to OptimalTopNController below.
N = 3                            # shown as "N=3" in the progress bar
isolation_window = 1             # NOTE(review): presumably in Da -- confirm
mz_tols = 10                     # NOTE(review): presumably in ppm -- confirm
rt_tols = 15                     # shown as "DEW=15" in the progress bar
min_ms1_intensity = 175000.0     # i.e. 1.75E5

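Run the `OptimalTopNController` in a loop. Each pass creates a fresh mass spectrometer and controller, runs the simulation, and writes its own mzML file.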

In [None]:
# Number of consecutive simulated runs; each one writes its own mzML file.
n_runs = 5

# Work on a private copy of the picked boxes. The recorded output of this cell
# shows len(controller.boxes) shrinking from one pass to the next
# (3523 -> 2951 -> 2921 -> ...), i.e. the box list handed to the controller is
# consumed as the runs progress. Passing `boxes` directly would therefore
# leave it depleted after the cell finishes, so re-running the cell (or any
# later cell using `boxes`) would silently start from a different state.
# NOTE(review): the depletion is inferred from the printed counts -- confirm
# against OptimalTopNController that it removes boxes from the list it is given.
remaining_boxes = copy.deepcopy(boxes)

# Every run writes into the same output folder, so compute it once.
out_dir = os.path.join(os.getcwd(), 'results')

for i in range(n_runs):
    # initialise mass spec and controller; the controller receives the
    # progressively depleted working copy rather than the original list
    mass_spec = IndependentMassSpectrometer(POSITIVE, dataset, ps)
    controller = OptimalTopNController(POSITIVE, N, isolation_window, mz_tols, rt_tols,
                                       min_ms1_intensity, remaining_boxes)
    print('len(boxes) = %d' % len(controller.boxes))

    # create an environment to run both the mass spec and controller
    env = Environment(mass_spec, controller, min_rt, max_rt, progress_bar=True)

    # set the log level to WARNING so we don't see too many messages when environment is running
    set_log_level_warning()

    # run the simulation
    env.run()

    # switch back to DEBUG so the mzML writer reports where the file goes
    set_log_level_debug()
    mzml_filename = 'optimaltopn_controller_%d.mzML' % i
    env.write_mzML(out_dir, mzml_filename)

(23.600s) ms_level=1 N=3 DEW=15:   2%|█▉                                                                                                                      | 23.59999999999998/1440 [00:00<00:10, 141.61it/s]

len(boxes) = 3523


(1440.000s) ms_level=1 N=3 DEW=15: 100%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉| 1439.6000000000672/1440 [00:23<00:00, 61.53it/s]
2020-08-21 16:49:44.850 | DEBUG    | vimms.Environment:write_mzML:163 - Writing mzML file to C:\Users\joewa\Work\git\vimms\demo\02. Methods\results\optimaltopn_controller_0.mzML
2020-08-21 16:49:51.633 | DEBUG    | vimms.Environment:write_mzML:170 - mzML file successfully written!
(24.000s) ms_level=1 N=3 DEW=15:   2%|█▉                                                                                                                      | 23.99999999999998/1440 [00:00<00:10, 133.68it/s]

len(boxes) = 2951


(1440.000s) ms_level=1 N=3 DEW=15: 100%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉| 1439.6000000000533/1440 [00:24<00:00, 58.47it/s]
2020-08-21 16:50:16.261 | DEBUG    | vimms.Environment:write_mzML:163 - Writing mzML file to C:\Users\joewa\Work\git\vimms\demo\02. Methods\results\optimaltopn_controller_1.mzML
2020-08-21 16:50:21.826 | DEBUG    | vimms.Environment:write_mzML:170 - mzML file successfully written!
(25.600s) ms_level=1 N=3 DEW=15:   2%|██                                                                                                                     | 25.599999999999973/1440 [00:00<00:10, 133.65it/s]

len(boxes) = 2921


(1440.000s) ms_level=1 N=3 DEW=15: 100%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉| 1439.6000000000533/1440 [00:23<00:00, 60.53it/s]
2020-08-21 16:50:45.615 | DEBUG    | vimms.Environment:write_mzML:163 - Writing mzML file to C:\Users\joewa\Work\git\vimms\demo\02. Methods\results\optimaltopn_controller_2.mzML
2020-08-21 16:50:51.335 | DEBUG    | vimms.Environment:write_mzML:170 - mzML file successfully written!
(21.600s) ms_level=1 N=3 DEW=15:   1%|█▊                                                                                                                     | 21.599999999999987/1440 [00:00<00:12, 113.59it/s]

len(boxes) = 2907


(1440.000s) ms_level=1 N=3 DEW=15: 100%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉| 1439.6000000000536/1440 [00:26<00:00, 55.15it/s]
2020-08-21 16:51:17.446 | DEBUG    | vimms.Environment:write_mzML:163 - Writing mzML file to C:\Users\joewa\Work\git\vimms\demo\02. Methods\results\optimaltopn_controller_3.mzML
2020-08-21 16:51:22.879 | DEBUG    | vimms.Environment:write_mzML:170 - mzML file successfully written!
(25.600s) ms_level=1 N=3 DEW=15:   2%|██                                                                                                                     | 25.599999999999973/1440 [00:00<00:09, 145.45it/s]

len(boxes) = 2899


(715.200s) ms_level=1 N=3 DEW=15:  50%|███████████████████████████████████████████████████████████▌                                                            | 715.1999999999765/1440 [00:15<00:15, 46.96it/s]