### 1. Retention times vs molecular weight

First, for each of the PEG standards, the relationship between retention time and molecular weight is given below.

In [1]:
import pandas as pd
import numpy as np
import glob 
import matplotlib.pyplot as plt


# Peak times and molecular weights of the oligomers assigned to each PEG
# standard. Within every standard the molecular weights rise in constant steps
# of 44 (presumably one ethylene-oxide repeat unit - confirm), so the series
# is generated with range() instead of being typed out value by value.

PEG_200 = {
    'Peak time': [4.20, 4.76, 5.48, 6.45],
    'Molecular weight': list(range(150, 282 + 1, 44)),
}

PEG_300 = {
    'Peak time': [4.20, 4.76, 5.48, 6.45, 7.74, 9.45, 11.11, 12.30],
    'Molecular weight': list(range(150, 458 + 1, 44)),
}

PEG_400 = {
    'Peak time': [
        4.76, 5.48, 6.45, 7.74, 9.45,
        11.11, 12.30, 13.20, 13.97, 14.63,
    ],
    'Molecular weight': list(range(194, 590 + 1, 44)),
}

PEG_1000 = {
    'Peak time': [
        14.63, 15.23, 15.78, 16.27, 16.72, 17.14,
        17.54, 17.91, 18.28, 18.61, 18.96, 19.27,
        19.59, 19.87, 20.17, 20.45, 20.72,
    ],
    'Molecular weight': list(range(590, 1294 + 1, 44)),
}




In [2]:
# Tabulate the PEG 200 standard; the Styler copy carries the caption and is
# the cell's last expression so the notebook renders it.
df_200 = pd.DataFrame(PEG_200)
df_200t = df_200.style.set_caption("PEG 200")
df_200t

Unnamed: 0,Peak time,Molecular weight
0,4.2,150
1,4.76,194
2,5.48,238
3,6.45,282


In [3]:
# Tabulate the PEG 300 standard; the Styler copy carries the caption and is
# the cell's last expression so the notebook renders it.
df_300 = pd.DataFrame(PEG_300)
df_300t = df_300.style.set_caption("PEG 300")
df_300t

Unnamed: 0,Peak time,Molecular weight
0,4.2,150
1,4.76,194
2,5.48,238
3,6.45,282
4,7.74,326
5,9.45,370
6,11.11,414
7,12.3,458


In [4]:
# Tabulate the PEG 400 standard; the Styler copy carries the caption and is
# the cell's last expression so the notebook renders it.
df_400 = pd.DataFrame(PEG_400)
df_400t = df_400.style.set_caption("PEG 400")
df_400t

Unnamed: 0,Peak time,Molecular weight
0,4.76,194
1,5.48,238
2,6.45,282
3,7.74,326
4,9.45,370
5,11.11,414
6,12.3,458
7,13.2,502
8,13.97,546
9,14.63,590


In [5]:
# Tabulate the PEG 1000 standard; the Styler copy carries the caption and is
# the cell's last expression so the notebook renders it.
df_1000 = pd.DataFrame(PEG_1000)
df_1000t = df_1000.style.set_caption("PEG 1000")
df_1000t

Unnamed: 0,Peak time,Molecular weight
0,14.63,590
1,15.23,634
2,15.78,678
3,16.27,722
4,16.72,766
5,17.14,810
6,17.54,854
7,17.91,898
8,18.28,942
9,18.61,986


### 2. Calibration curves nanofiltration

Below, the data gathered at three concentrations (50, 200 and 400 ppm) are imported. Because every sample was analyzed three times, averages are calculated over the replicate measurements.

In [6]:
# Collect every CSV export in the calibration folder and load each one into
# its own DataFrame.
# The backslashes in the Windows path are doubled because a single backslash
# starts an escape sequence inside an ordinary Python string literal.

path = 'C:\\Users\\cdierend\\OneDrive - UGent\\Universiteit Gent\\Research\\FWO Biostable\\6_MWCO\\Exp_6.1\\2_RawData\\20220202_NF_mix_calibration\\'

# `path` already ends with a separator, so only the wildcard is appended
# (the earlier "\*.csv" relied on the invalid escape sequence "\*").
# glob returns matches in arbitrary order; sorting makes the load order, and
# therefore the order of the displayed tables, reproducible between runs.
filenames = sorted(glob.glob(path + "*.csv"))

if not filenames:
    # Make a wrong or unavailable folder visible instead of silently
    # continuing with an empty list.
    print(f"No CSV files found in {path}")

dataframes_list = []

# Read each file: UTF-16 encoded, tab separated, comma as decimal mark, and
# no header row (column names are supplied explicitly).
for file in filenames:
    temp_df = pd.read_csv(
        file,
        encoding="UTF-16",
        sep='\t',
        decimal=',',
        names=["Peak number", "Retention time", "Area"],
    )
    # Force numeric dtypes so a non-numeric entry fails here rather than later.
    temp_df['Retention time'] = pd.to_numeric(temp_df['Retention time'])
    temp_df['Area'] = pd.to_numeric(temp_df['Area'])
    # Label the index with the source file so each displayed table can be
    # traced back to its measurement.
    temp_df.index.name = file
    dataframes_list.append(temp_df)

# Show every loaded table for a visual sanity check.
for dataset in dataframes_list:
    display(dataset)

Unnamed: 0_level_0,Peak number,Retention time,Area
C:\Users\cdierend\OneDrive - UGent\Universiteit Gent\Research\FWO Biostable\6_MWCO\Exp_6.1\2_RawData\20220202_NF_mix_calibration\20220202_CD_NF_MIX_200_1.CSV,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
0,1,4.177238,192.176529
1,2,4.742815,2203.931152
2,3,5.462861,2671.651123
3,4,6.425039,2381.671387
4,5,7.715343,1564.802612
5,6,9.38484,1119.617676
6,7,11.06131,682.281006
7,8,12.235253,454.081512
8,9,13.138577,259.420624
9,10,13.901608,178.365509


Unnamed: 0_level_0,Peak number,Retention time,Area
C:\Users\cdierend\OneDrive - UGent\Universiteit Gent\Research\FWO Biostable\6_MWCO\Exp_6.1\2_RawData\20220202_NF_mix_calibration\20220202_CD_NF_MIX_200_2.CSV,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
0,1,4.182164,294.50293
1,2,4.729541,2577.244141
2,3,5.450314,3230.142822
3,4,6.403797,2524.185791
4,5,7.685133,1868.479126
5,6,9.386229,1090.676636
6,7,11.047713,833.3797
7,8,12.225723,462.311859
8,9,13.146482,265.882233
9,10,13.899796,179.382324


Unnamed: 0_level_0,Peak number,Retention time,Area
C:\Users\cdierend\OneDrive - UGent\Universiteit Gent\Research\FWO Biostable\6_MWCO\Exp_6.1\2_RawData\20220202_NF_mix_calibration\20220202_CD_NF_MIX_200_3.CSV,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
0,1,4.162761,331.298553
1,2,4.720312,2479.748047
2,3,5.441193,3255.488037
3,4,6.408759,2481.852783
4,5,7.669256,1829.964355
5,6,9.363254,1052.818359
6,7,11.053404,777.350159
7,8,12.2053,435.851715
8,9,13.129954,265.774323
9,10,13.887945,176.318954


Unnamed: 0_level_0,Peak number,Retention time,Area
C:\Users\cdierend\OneDrive - UGent\Universiteit Gent\Research\FWO Biostable\6_MWCO\Exp_6.1\2_RawData\20220202_NF_mix_calibration\20220202_CD_NF_MIX_400_1.CSV,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
0,1,4.183094,1076.675537
1,2,4.724296,7220.896484
2,3,5.431962,8112.047852
3,4,6.39059,6061.312988
4,5,7.653795,4274.445801
5,6,9.353193,2559.442139
6,7,11.040033,1809.665771
7,8,12.232685,1131.493652
8,9,13.148311,597.939087
9,10,13.909313,425.287964


Unnamed: 0_level_0,Peak number,Retention time,Area
C:\Users\cdierend\OneDrive - UGent\Universiteit Gent\Research\FWO Biostable\6_MWCO\Exp_6.1\2_RawData\20220202_NF_mix_calibration\20220202_CD_NF_MIX_400_2.CSV,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
0,1,4.191647,943.69635
1,2,4.742314,6631.546875
2,3,5.463537,7578.331543
3,4,6.411952,5989.44043
4,5,7.693782,4208.971191
5,6,9.386427,2585.57251
6,7,11.060834,1824.893188
7,8,12.235903,1096.19458
8,9,13.154125,609.130737
9,10,13.925736,398.699615


Unnamed: 0_level_0,Peak number,Retention time,Area
C:\Users\cdierend\OneDrive - UGent\Universiteit Gent\Research\FWO Biostable\6_MWCO\Exp_6.1\2_RawData\20220202_NF_mix_calibration\20220202_CD_NF_MIX_400_3.CSV,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
0,1,4.18577,953.017822
1,2,4.732692,6604.410645
2,3,5.439216,7500.71582
3,4,6.393296,6083.070801
4,5,7.655911,4165.673828
5,6,9.334863,2575.481934
6,7,11.039319,1894.908936
7,8,12.21399,1061.878052
8,9,13.123474,598.805237
9,10,13.896055,382.222168


Unnamed: 0_level_0,Peak number,Retention time,Area
C:\Users\cdierend\OneDrive - UGent\Universiteit Gent\Research\FWO Biostable\6_MWCO\Exp_6.1\2_RawData\20220202_NF_mix_calibration\20220202_CD_NF_MIX_50_1.CSV,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
0,1,4.139738,428.56665
1,2,4.733204,379.394928
2,3,5.458529,527.785645
3,4,6.405911,434.384766
4,5,7.701005,324.676666
5,6,9.386744,175.361008
6,7,11.073651,172.827682
7,8,15.162521,63.817566
8,9,16.164377,208.179657
9,10,16.584312,259.41333


Unnamed: 0_level_0,Peak number,Retention time,Area
C:\Users\cdierend\OneDrive - UGent\Universiteit Gent\Research\FWO Biostable\6_MWCO\Exp_6.1\2_RawData\20220202_NF_mix_calibration\20220202_CD_NF_MIX_50_2.CSV,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
0,1,4.731463,360.320831
1,2,5.463006,530.971741
2,3,6.413262,449.791321
3,4,7.709707,335.860901
4,5,9.393996,219.473984
5,6,11.08273,145.048615
6,7,12.23504,97.695282
7,8,13.122313,45.399284
8,9,13.927246,37.622074
9,10,15.125947,56.942005


Unnamed: 0_level_0,Peak number,Retention time,Area
C:\Users\cdierend\OneDrive - UGent\Universiteit Gent\Research\FWO Biostable\6_MWCO\Exp_6.1\2_RawData\20220202_NF_mix_calibration\20220202_CD_NF_MIX_50_3.CSV,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
0,1,4.693408,455.630859
1,2,5.449098,524.039185
2,3,6.404566,435.222992
3,4,7.685017,319.118896
4,5,9.363736,180.455322
5,6,11.073334,102.143494
6,7,12.208297,88.461693
7,8,13.136082,57.442104
8,9,14.560866,34.809879
9,10,15.101143,39.01635
