In [1]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import math

import warnings
warnings.filterwarnings('ignore')

# General Functions

In [2]:
#doe1['Total Gas Flow Rate (sccm)'][2]/2
def rh(td, t, a=17.625, b=243.04):
    """Return the relative humidity, in percent, for a dew point and a temperature.

    Uses the Magnus-type approximation
    ``RH = 100 * exp(a*td / (b + td)) / exp(a*t / (b + t))``.

    Parameters
    ----------
    td : float
        Dew point (the notebook passes its "Dew Point (C)" values).
    t : float
        Air temperature (the notebook passes its "Temperature (C)" values).
    a, b : float, optional
        Coefficients of the approximation. The defaults (17.625 and 243.04)
        are the values that used to be hard-coded in the formula.

    Returns
    -------
    float
        Relative humidity in percent. A NaN input yields a NaN result.

    Raises
    ------
    ZeroDivisionError
        For plain Python floats, when ``td`` or ``t`` equals ``-b``.
    """
    # The ratio-of-exponentials form is kept (rather than exp of a difference)
    # so results stay bit-identical to values computed with the old version.
    dew_point_term = math.exp((a*td)/(b+td))
    temperature_term = math.exp((a*t)/(b+t))
    return 100*(dew_point_term/temperature_term)

In [3]:
# Column schema shared by every standardized per-set table built in this notebook.
df_columns = [
    # sample identity
    'ID',
    'datetime',
    # gas flows during annealing, growth and cooling
    'Annealing H2 (sccm)',
    'Growth H2 (sccm)',
    'Growth CH4 (sccm)',
    'Growth He (sccm)',
    'Cooling H2 (sccm)',
    'Cooling CH4 (sccm)',
    'Cooling He (sccm)',
    'Growth Time (min)',
    # ambient readings and the humidity computed from them
    'Dew Point (C)',
    'Temperature (C)',
    'Relative Humidity (pct)',
    # outcome
    'Res: Graphene Presence',
    # 'CP:' columns are filled in by the per-set loops (flow totals, ratios, set labels)
    'CP: Total Flow Rate (sccm)',
    'CP: CH4/Total',
    'CP: CH4/H2',
    'CP: Dil CH4',
    'CP: Set No',
]

# DoE Set 1

In [4]:
# Load the raw Set 1 sheet; header=2 takes the column names from the third line of the file.
doe1 = pd.read_csv('Set 1.csv', header=2)

In [5]:
# Discard the sheet columns that are not carried into the standardized table.
doe1 = doe1.drop(columns=['Unnamed: 0','Regions', 'Unnamed: 6', 'Folder Name','Link','Coverage','Avg. Crystal Size','Nucleation Density'])

In [6]:
# The sample-ID column has no header in the CSV (pandas labels it 'Unnamed: 3'); give it a real name.
doe1 = doe1.rename(columns={'Unnamed: 3':'Sample ID'})

In [7]:
# Hand-entered dew point readings for the 16 Set 1 rows, in row order (NaN = no reading).
# Plain column assignment replaces DataFrame.insert so the cell can be re-run:
# insert() raises ValueError once the column exists. The frame has four columns
# at this point, so the new column still lands at position 4 (the end).
doe1['Dew Point(C)'] = [np.nan,np.nan,np.nan,np.nan,np.nan,np.nan,np.nan,np.nan,np.nan,np.nan,np.nan,1.9,1.74,5.3, -1.86, -1.86]

In [8]:
# Hand-entered temperature readings for the 16 Set 1 rows, in row order (NaN = no reading).
# Plain column assignment replaces DataFrame.insert so the cell can be re-run:
# insert() raises ValueError once the column exists. The frame has five columns
# at this point, so the new column still lands at position 5 (the end).
doe1['Temperature(C)'] = [np.nan,np.nan,np.nan,np.nan,np.nan,np.nan,np.nan,np.nan,np.nan,np.nan,np.nan,23.2,23,23.1, 23.2, 23.2]

In [9]:
doe1

Unnamed: 0,Growth Duration (min),Total Gas Flow Rate (sccm),Sample ID,Graphene,Dew Point(C),Temperature(C)
0,15,200,20191211_1,No,,
1,15,1000,20191211_2,Yes,,
2,5,1000,20191211_3,No,,
3,5,1000,20191216_2,No,,
4,15,200,20191216_3,Maybe,,
5,15,200,20191216_4,Maybe,,
6,15,200,20191216_5,No,,
7,15,1000,20191217_1,Yes,,
8,5,1000,20191218_1,Yes,,
9,5,200,20191218_2,Yes,,


In [10]:
# Pre-allocate the standardized Set 1 table: rows 0-15 and the shared column schema.
# No data is passed, so every cell starts out as NaN.
df_doe1 = pd.DataFrame(index=range(16), 
                       columns = df_columns)

In [11]:
# Fill the standardized Set 1 table row by row from the raw sheet.
# Cells are written with df_doe1.loc[row, column]. The earlier
# df_doe1[column][row] = value form is chained assignment, which pandas does not
# guarantee to write through to the frame (with Copy-on-Write it never does),
# and this notebook silences the warning that would report it.
for i in range(16):  # one iteration per pre-allocated row of df_doe1
    sample_id = doe1['Sample ID'][i]
    total_flow = doe1['Total Gas Flow Rate (sccm)'][i]
    dew_point = doe1['Dew Point(C)'][i]
    temperature = doe1['Temperature(C)'][i]

    # H2 and He are each half of the sheet's total-flow value, CH4 is 1/200 of it.
    h2_flow = total_flow/2
    ch4_flow = total_flow/200
    he_flow = total_flow/2
    growth_total = ch4_flow+h2_flow+he_flow

    df_doe1.loc[i, 'ID'] = sample_id
    # Dropping the last two characters of the ID (e.g. '_1') leaves the date part.
    df_doe1.loc[i, 'datetime'] = pd.to_datetime(sample_id[:-2])
    df_doe1.loc[i, 'Annealing H2 (sccm)'] = h2_flow
    df_doe1.loc[i, 'Growth H2 (sccm)'] = h2_flow
    df_doe1.loc[i, 'Growth CH4 (sccm)'] = ch4_flow
    df_doe1.loc[i, 'Growth He (sccm)'] = he_flow
    # Cooling is recorded with He only.
    df_doe1.loc[i, 'Cooling H2 (sccm)'] = 0
    df_doe1.loc[i, 'Cooling CH4 (sccm)'] = 0
    df_doe1.loc[i, 'Cooling He (sccm)'] = he_flow
    df_doe1.loc[i, 'Growth Time (min)'] = doe1['Growth Duration (min)'][i]
    df_doe1.loc[i, 'Dew Point (C)'] = dew_point
    df_doe1.loc[i, 'Temperature (C)'] = temperature
    # Rows without a dew point / temperature reading hold NaN and get a NaN humidity.
    df_doe1.loc[i, 'Relative Humidity (pct)'] = rh(dew_point, temperature)
    df_doe1.loc[i, 'Res: Graphene Presence'] = doe1['Graphene'][i]
    df_doe1.loc[i, 'CP: Total Flow Rate (sccm)'] = growth_total
    df_doe1.loc[i, 'CP: CH4/Total'] = ch4_flow/growth_total
    df_doe1.loc[i, 'CP: CH4/H2'] = ch4_flow/h2_flow
    df_doe1.loc[i, 'CP: Dil CH4'] = False
    df_doe1.loc[i, 'CP: Set No'] = 1

In [12]:
df_doe1

Unnamed: 0,ID,datetime,Annealing H2 (sccm),Growth H2 (sccm),Growth CH4 (sccm),Growth He (sccm),Cooling H2 (sccm),Cooling CH4 (sccm),Cooling He (sccm),Growth Time (min),Dew Point (C),Temperature (C),Relative Humidity (pct),Res: Graphene Presence,CP: Total Flow Rate (sccm),CP: CH4/Total,CP: CH4/H2,CP: Dil CH4,CP: Set No
0,20191211_1,2019-12-11 00:00:00,100.0,100.0,1.0,100.0,0,0,100.0,15,,,,No,201.0,0.004975,0.01,False,1
1,20191211_2,2019-12-11 00:00:00,500.0,500.0,5.0,500.0,0,0,500.0,15,,,,Yes,1005.0,0.004975,0.01,False,1
2,20191211_3,2019-12-11 00:00:00,500.0,500.0,5.0,500.0,0,0,500.0,5,,,,No,1005.0,0.004975,0.01,False,1
3,20191216_2,2019-12-16 00:00:00,500.0,500.0,5.0,500.0,0,0,500.0,5,,,,No,1005.0,0.004975,0.01,False,1
4,20191216_3,2019-12-16 00:00:00,100.0,100.0,1.0,100.0,0,0,100.0,15,,,,Maybe,201.0,0.004975,0.01,False,1
5,20191216_4,2019-12-16 00:00:00,100.0,100.0,1.0,100.0,0,0,100.0,15,,,,Maybe,201.0,0.004975,0.01,False,1
6,20191216_5,2019-12-16 00:00:00,100.0,100.0,1.0,100.0,0,0,100.0,15,,,,No,201.0,0.004975,0.01,False,1
7,20191217_1,2019-12-17 00:00:00,500.0,500.0,5.0,500.0,0,0,500.0,15,,,,Yes,1005.0,0.004975,0.01,False,1
8,20191218_1,2019-12-18 00:00:00,500.0,500.0,5.0,500.0,0,0,500.0,5,,,,Yes,1005.0,0.004975,0.01,False,1
9,20191218_2,2019-12-18 00:00:00,100.0,100.0,1.0,100.0,0,0,100.0,5,,,,Yes,201.0,0.004975,0.01,False,1


# DoE Set 2

In [13]:
# Load the raw Set 2 sheet; header=2 takes the column names from the third line of the file.
doe2 = pd.read_csv('Set 2.csv', header=2)

In [14]:
# Keep all rows and the seven columns at positions 1-7; column 0 and anything from position 8 on are dropped.
doe2 = doe2.iloc[:,1:8]

In [15]:
# Name the two header-less columns (labelled 'Unnamed: 3' and 'Unnamed: 4' by pandas).
doe2 = doe2.rename(columns={'Unnamed: 3': 'Time', 'Unnamed: 4':'Sample ID'})

In [16]:
#doe2.insert(7, 'datetime', 1)

In [17]:
#for i in range(16):
#    doe2['datetime'][i] = pd.to_datetime(doe2['Sample ID'][i][:-2]+' '+doe2['Time'][i])

In [18]:
doe2

Unnamed: 0,Growth Duration (min),Total Gas Flow Rate (sccm),Time,Sample ID,Graphene,Dew,Temp
0,7,200,2:35 PM,20200307_1,No,-1.72,22.5
1,7,280,1:00 AM,20200308_1,No,-1.04,22.8
2,5,280,7:26 PM,20200308_2,Yes,0.44,23.3
3,5,280,1:50 AM,20200309_1,Yes,0.98,23.3
4,7,200,4:10 AM,20200309_2,No,1.42,23.7
5,7,200,4:45 PM,20200310_1,No,5.44,23.2
6,7,200,8:02 PM,20200310_2,No,5.04,23.1
7,7,280,1:07 AM,20200311_1,Yes,5.32,23.2
8,5,280,2:58 PM,20200311_2,Maybe,5.56,23.1
9,5,200,5:47 PM,20200312_1,No,11.38,23.8


In [19]:
# Pre-allocate the standardized Set 2 table: rows 0-15 and the shared column schema.
# No data is passed, so every cell starts out as NaN.
df_doe2 = pd.DataFrame(index=range(16), 
                       columns = df_columns)

In [20]:
# Fill the standardized Set 2 table row by row from the raw sheet.
# Cells are written with df_doe2.loc[row, column]. The earlier
# df_doe2[column][row] = value form is chained assignment, which pandas does not
# guarantee to write through to the frame (with Copy-on-Write it never does),
# and this notebook silences the warning that would report it.
for i in range(16):  # one iteration per pre-allocated row of df_doe2
    sample_id = doe2['Sample ID'][i]
    total_flow = doe2['Total Gas Flow Rate (sccm)'][i]
    dew_point = doe2['Dew'][i]
    temperature = doe2['Temp'][i]

    # H2 and He are each half of the sheet's total-flow value, CH4 is 1/200 of it.
    h2_flow = total_flow/2
    ch4_flow = total_flow/200
    he_flow = total_flow/2
    growth_total = ch4_flow+h2_flow+he_flow

    df_doe2.loc[i, 'ID'] = sample_id
    # Date part of the ID (last two characters removed) plus the recorded clock time.
    df_doe2.loc[i, 'datetime'] = pd.to_datetime(sample_id[:-2]+' '+doe2['Time'][i])
    df_doe2.loc[i, 'Annealing H2 (sccm)'] = h2_flow
    df_doe2.loc[i, 'Growth H2 (sccm)'] = h2_flow
    df_doe2.loc[i, 'Growth CH4 (sccm)'] = ch4_flow
    df_doe2.loc[i, 'Growth He (sccm)'] = he_flow
    # Cooling is recorded with He only.
    df_doe2.loc[i, 'Cooling H2 (sccm)'] = 0
    df_doe2.loc[i, 'Cooling CH4 (sccm)'] = 0
    df_doe2.loc[i, 'Cooling He (sccm)'] = he_flow
    df_doe2.loc[i, 'Growth Time (min)'] = doe2['Growth Duration (min)'][i]
    df_doe2.loc[i, 'Dew Point (C)'] = dew_point
    df_doe2.loc[i, 'Temperature (C)'] = temperature
    df_doe2.loc[i, 'Relative Humidity (pct)'] = rh(dew_point, temperature)
    df_doe2.loc[i, 'Res: Graphene Presence'] = doe2['Graphene'][i]
    df_doe2.loc[i, 'CP: Total Flow Rate (sccm)'] = growth_total
    df_doe2.loc[i, 'CP: CH4/Total'] = ch4_flow/growth_total
    df_doe2.loc[i, 'CP: CH4/H2'] = ch4_flow/h2_flow
    df_doe2.loc[i, 'CP: Dil CH4'] = False
    df_doe2.loc[i, 'CP: Set No'] = 2

In [21]:
df_doe2

Unnamed: 0,ID,datetime,Annealing H2 (sccm),Growth H2 (sccm),Growth CH4 (sccm),Growth He (sccm),Cooling H2 (sccm),Cooling CH4 (sccm),Cooling He (sccm),Growth Time (min),Dew Point (C),Temperature (C),Relative Humidity (pct),Res: Graphene Presence,CP: Total Flow Rate (sccm),CP: CH4/Total,CP: CH4/H2,CP: Dil CH4,CP: Set No
0,20200307_1,2020-03-07 14:35:00,100.0,100.0,1.0,100.0,0,0,100.0,7,-1.72,22.5,19.808864,No,201.0,0.004975,0.01,False,2
1,20200308_1,2020-03-08 01:00:00,140.0,140.0,1.4,140.0,0,0,140.0,7,-1.04,22.8,20.446319,No,281.4,0.004975,0.01,False,2
2,20200308_2,2020-03-08 19:26:00,140.0,140.0,1.4,140.0,0,0,140.0,5,0.44,23.3,22.090501,Yes,281.4,0.004975,0.01,False,2
3,20200309_1,2020-03-09 01:50:00,140.0,140.0,1.4,140.0,0,0,140.0,5,0.98,23.3,22.967499,Yes,281.4,0.004975,0.01,False,2
4,20200309_2,2020-03-09 04:10:00,100.0,100.0,1.0,100.0,0,0,100.0,7,1.42,23.7,23.139883,No,201.0,0.004975,0.01,False,2
5,20200310_1,2020-03-10 16:45:00,100.0,100.0,1.0,100.0,0,0,100.0,7,5.44,23.2,31.664745,No,201.0,0.004975,0.01,False,2
6,20200310_2,2020-03-10 20:02:00,100.0,100.0,1.0,100.0,0,0,100.0,7,5.04,23.1,30.983451,No,201.0,0.004975,0.01,False,2
7,20200311_1,2020-03-11 01:07:00,140.0,140.0,1.4,140.0,0,0,140.0,7,5.32,23.2,31.402091,Yes,281.4,0.004975,0.01,False,2
8,20200311_2,2020-03-11 14:58:00,140.0,140.0,1.4,140.0,0,0,140.0,5,5.56,23.1,32.122949,Maybe,281.4,0.004975,0.01,False,2
9,20200312_1,2020-03-12 17:47:00,100.0,100.0,1.0,100.0,0,0,100.0,5,11.38,23.8,45.673245,No,201.0,0.004975,0.01,False,2


# DoE Set 3

In [22]:
# Load the raw Set 3 sheet; header=2 takes the column names from the third line of the file.
doe3 = pd.read_csv('Set 3.csv', header=2)

In [23]:
# Keep all rows and the seven columns at positions 1-7; column 0 and anything from position 8 on are dropped.
doe3 = doe3.iloc[:,1:8]

In [24]:
# Name the three header-less columns (labelled 'Unnamed: 1', 'Unnamed: 3' and 'Unnamed: 4' by pandas).
doe3 = doe3.rename(columns={'Unnamed: 1': 'Growth Duration (min)', 'Unnamed: 3': 'Time', 'Unnamed: 4':'Sample ID'})

In [25]:
doe3

Unnamed: 0,Growth Duration (min),Total Gas Flow Rate (sccm),Time,Sample ID,Graphene,Dew,Temp
0,7,280,1:07 PM,20200629_1,Maybe,13.04,25.5
1,7,280,11:00 AM,20200630_1,No,12.96,25.5
2,7,1000,1:40 PM,20200630_2,Yes,12.74,25.7
3,7,760,4:56 PM,20200702_1,Yes,12.3,25.2
4,7,760,7:31 PM,20200702_2,Yes,12.76,26.0
5,7,520,10:35 PM,20200702_3,Yes,13.04,26.0
6,7,520,1:52 AM,20200703_1,Yes,13.42,25.8
7,7,520,11:00 PM,20200703_2,Yes,13.2,26.0
8,7,1000,2:20 AM,20200704_1,Yes,13.16,26.6
9,7,760,3:55 PM,20200705_1,Yes,13.2,25.5


In [26]:
# Pre-allocate the standardized Set 3 table: rows 0-15 and the shared column schema.
# No data is passed, so every cell starts out as NaN.
df_doe3 = pd.DataFrame(index=range(16), 
                       columns = df_columns)

In [27]:
# Fill the standardized Set 3 table row by row from the raw sheet.
# Cells are written with df_doe3.loc[row, column]. The earlier
# df_doe3[column][row] = value form is chained assignment, which pandas does not
# guarantee to write through to the frame (with Copy-on-Write it never does),
# and this notebook silences the warning that would report it.
for i in range(16):  # one iteration per pre-allocated row of df_doe3
    sample_id = doe3['Sample ID'][i]
    total_flow = doe3['Total Gas Flow Rate (sccm)'][i]
    dew_point = doe3['Dew'][i]
    temperature = doe3['Temp'][i]

    # H2 and He are each half of the sheet's total-flow value, CH4 is 1/200 of it.
    h2_flow = total_flow/2
    ch4_flow = total_flow/200
    he_flow = total_flow/2
    growth_total = ch4_flow+h2_flow+he_flow

    df_doe3.loc[i, 'ID'] = sample_id
    # Date part of the ID (last two characters removed) plus the recorded clock time.
    df_doe3.loc[i, 'datetime'] = pd.to_datetime(sample_id[:-2]+' '+doe3['Time'][i])
    df_doe3.loc[i, 'Annealing H2 (sccm)'] = h2_flow
    df_doe3.loc[i, 'Growth H2 (sccm)'] = h2_flow
    df_doe3.loc[i, 'Growth CH4 (sccm)'] = ch4_flow
    df_doe3.loc[i, 'Growth He (sccm)'] = he_flow
    # Cooling is recorded with He only.
    df_doe3.loc[i, 'Cooling H2 (sccm)'] = 0
    df_doe3.loc[i, 'Cooling CH4 (sccm)'] = 0
    df_doe3.loc[i, 'Cooling He (sccm)'] = he_flow
    df_doe3.loc[i, 'Growth Time (min)'] = doe3['Growth Duration (min)'][i]
    df_doe3.loc[i, 'Dew Point (C)'] = dew_point
    df_doe3.loc[i, 'Temperature (C)'] = temperature
    df_doe3.loc[i, 'Relative Humidity (pct)'] = rh(dew_point, temperature)
    df_doe3.loc[i, 'Res: Graphene Presence'] = doe3['Graphene'][i]
    df_doe3.loc[i, 'CP: Total Flow Rate (sccm)'] = growth_total
    df_doe3.loc[i, 'CP: CH4/Total'] = ch4_flow/growth_total
    df_doe3.loc[i, 'CP: CH4/H2'] = ch4_flow/h2_flow
    df_doe3.loc[i, 'CP: Dil CH4'] = False
    df_doe3.loc[i, 'CP: Set No'] = 3

In [28]:
df_doe3

Unnamed: 0,ID,datetime,Annealing H2 (sccm),Growth H2 (sccm),Growth CH4 (sccm),Growth He (sccm),Cooling H2 (sccm),Cooling CH4 (sccm),Cooling He (sccm),Growth Time (min),Dew Point (C),Temperature (C),Relative Humidity (pct),Res: Graphene Presence,CP: Total Flow Rate (sccm),CP: CH4/Total,CP: CH4/H2,CP: Dil CH4,CP: Set No
0,20200629_1,2020-06-29 13:07:00,140.0,140.0,1.4,140.0,0,0,140.0,7,13.04,25.5,46.01787,Maybe,281.4,0.004975,0.01,False,3
1,20200630_1,2020-06-30 11:00:00,140.0,140.0,1.4,140.0,0,0,140.0,7,12.96,25.5,45.777947,No,281.4,0.004975,0.01,False,3
2,20200630_2,2020-06-30 13:40:00,500.0,500.0,5.0,500.0,0,0,500.0,7,12.74,25.7,44.591318,Yes,1005.0,0.004975,0.01,False,3
3,20200702_1,2020-07-02 16:56:00,380.0,380.0,3.8,380.0,0,0,380.0,7,12.3,25.2,44.629359,Yes,763.8,0.004975,0.01,False,3
4,20200702_2,2020-07-02 19:31:00,380.0,380.0,3.8,380.0,0,0,380.0,7,12.76,26.0,43.863161,Yes,763.8,0.004975,0.01,False,3
5,20200702_3,2020-07-02 22:35:00,260.0,260.0,2.6,260.0,0,0,260.0,7,13.04,26.0,44.673694,Yes,522.6,0.004975,0.01,False,3
6,20200703_1,2020-07-03 01:52:00,260.0,260.0,2.6,260.0,0,0,260.0,7,13.42,25.8,46.340437,Yes,522.6,0.004975,0.01,False,3
7,20200703_2,2020-07-03 23:00:00,260.0,260.0,2.6,260.0,0,0,260.0,7,13.2,26.0,45.142752,Yes,522.6,0.004975,0.01,False,3
8,20200704_1,2020-07-04 02:20:00,500.0,500.0,5.0,500.0,0,0,500.0,7,13.16,26.6,43.457823,Yes,1005.0,0.004975,0.01,False,3
9,20200705_1,2020-07-05 15:55:00,380.0,380.0,3.8,380.0,0,0,380.0,7,13.2,25.5,46.501041,Yes,763.8,0.004975,0.01,False,3


# DoE Set 4

In [58]:
# Constants:

# Multiplier applied to the CH4 'K' digit parsed from 'Gas Flow Rates (He:CH4:H2)'
# when the Set 4 table is filled.
# NOTE(review): presumably a flow-controller calibration factor - confirm its origin and units.
k_doe4 = 1.716

In [59]:
# Load the raw Set 4 sheet; no header= offset is given, so the first line supplies the column names.
doe4 = pd.read_csv('Set 4.csv')

In [60]:
# Keep all rows and the thirteen columns at positions 1-13; column 0 and anything from position 14 on are dropped.
doe4 = doe4.iloc[:, 1:14]

In [61]:
doe4

Unnamed: 0,Total Gas Flow Rate (sccm),Growth Duration (min),Cooling Type,Gas Flow Rates (He:CH4:H2),Polishing Data,Name,Sample Name,Time of Experiment,SEM,Temperature,Dew Point,Relative Humidity,Graphene Presence
0,500,5.0,NC,475 : 1K : 25,AS_20200921_1,AS,20200921_1,5:00 PM,AS,22.5,7.1,37.040835,No
1,500,5.0,GC,475 : 1K : 25,AS_20200921_1,AS,20200921_2,8:20 PM,AS,23.0,7.98,38.158064,No
2,1000,5.0,GC,950 : 2K : 50,AS_20200922_1,AS,20200922_1,12:50 AM,AS,22.5,8.76,41.467763,Yes
3,1000,5.0,GC,950 : 2K : 50,AS_20200922_1,AS,20200922_2,10:50 AM,AS,22.5,11.38,49.40754,Yes
4,500,5.0,NC,475 : 1K : 25,AS_20200922_2,AS,20200922_3,2:25 PM,AS,23.0,11.24,47.489815,No
5,500,5.0,GC,475 : 1K : 25,AS_20200922_2,AS,20200922_4,8:30 PM,AS,23.3,10.82,45.354451,No
6,500,7.5,NC,475 : 1K : 25,AS_20200923_1,AS,20200923_2,9:45 PM,MS,22.9,9.92,43.757547,No
7,1000,10.0,NC,950 : 2K : 50,AS_20200923_1,AS,20200924_1,12:45 AM,MS,23.0,10.34,44.731545,Yes
8,1000,7.5,GC,950 : 2K : 50,AS_20200924_1,AS,20200924_3,7:00 AM,MS,23.0,11.4,47.995561,Yes
9,1000,10.0,GC,950 : 2K : 50,AS_20200924_2,AS,20200924_4,11:00 AM,JY,23.2,11.6,48.049708,No


In [62]:
# Pre-allocate the standardized Set 4 table: rows 0-59 and the shared column schema.
# No data is passed, so every cell starts out as NaN.
df_doe4 = pd.DataFrame(index=range(60), 
                       columns = df_columns)

In [63]:
#int(doe4['Gas Flow Rates (He:CH4:H2)'][1][:3])+int(doe4['Gas Flow Rates (He:CH4:H2)'][1][6])*k_doe4*0.99
#int(doe4['Gas Flow Rates (He:CH4:H2)'][2][6])*k_doe4*0.01
#doe4['Cooling Type'][1]

In [64]:
# Fill the standardized Set 4 table row by row from the raw sheet.
# Cells are written with df_doe4.loc[row, column]. The earlier
# df_doe4[column][row] = value form is chained assignment, which pandas does not
# guarantee to write through to the frame (with Copy-on-Write it never does),
# and this notebook silences the warning that would report it.
for i in range(60):  # one iteration per pre-allocated row of df_doe4
    sample_name = doe4['Sample Name'][i]
    flow_spec = doe4['Gas Flow Rates (He:CH4:H2)'][i]
    cooling_type = doe4['Cooling Type'][i]
    dew_point = doe4['Dew Point'][i]
    temperature = doe4['Temperature'][i]

    # Parse the 'He : CH4 : H2' string (e.g. '475 : 1K : 25') by fixed position.
    # NOTE(review): this only works for a 3-digit He value, a single-digit CH4
    # 'K' value at index 6 and a 2-digit H2 value - confirm every row fits.
    he_setpoint = int(flow_spec[:3])
    ch4_k = int(flow_spec[6])
    h2_flow = int(flow_spec[-2:])

    # The scaled CH4-line value (ch4_k*k_doe4) is split 1 % to CH4 and 99 % to He.
    # NOTE(review): presumably a 1 % CH4-in-He mixture - confirm.
    ch4_flow = ch4_k*k_doe4*0.01
    he_flow = he_setpoint+ch4_k*k_doe4*0.99
    growth_total = ch4_flow+h2_flow+he_flow

    df_doe4.loc[i, 'ID'] = sample_name
    # Date part of the sample name (last two characters removed) plus the recorded clock time.
    df_doe4.loc[i, 'datetime'] = pd.to_datetime(sample_name[:-2]+' '+doe4['Time of Experiment'][i])

    df_doe4.loc[i, 'Annealing H2 (sccm)'] = h2_flow

    df_doe4.loc[i, 'Growth H2 (sccm)'] = h2_flow
    df_doe4.loc[i, 'Growth CH4 (sccm)'] = ch4_flow
    df_doe4.loc[i, 'Growth He (sccm)'] = he_flow

    # 'NC' rows cool under the He set-point only; 'GC' rows cool under the same
    # three flows as growth. Any other cooling type leaves the cooling columns NaN.
    if cooling_type == 'NC':
        df_doe4.loc[i, 'Cooling H2 (sccm)'] = 0
        df_doe4.loc[i, 'Cooling CH4 (sccm)'] = 0
        df_doe4.loc[i, 'Cooling He (sccm)'] = he_setpoint
    elif cooling_type == 'GC':
        df_doe4.loc[i, 'Cooling H2 (sccm)'] = h2_flow
        df_doe4.loc[i, 'Cooling CH4 (sccm)'] = ch4_flow
        df_doe4.loc[i, 'Cooling He (sccm)'] = he_flow

    df_doe4.loc[i, 'Growth Time (min)'] = doe4['Growth Duration (min)'][i]

    df_doe4.loc[i, 'Dew Point (C)'] = dew_point
    df_doe4.loc[i, 'Temperature (C)'] = temperature
    # Recomputed from dew point and temperature rather than copied from the sheet.
    df_doe4.loc[i, 'Relative Humidity (pct)'] = rh(dew_point, temperature)

    df_doe4.loc[i, 'Res: Graphene Presence'] = doe4['Graphene Presence'][i]

    df_doe4.loc[i, 'CP: Total Flow Rate (sccm)'] = growth_total
    df_doe4.loc[i, 'CP: CH4/Total'] = ch4_flow/growth_total
    df_doe4.loc[i, 'CP: CH4/H2'] = ch4_flow/h2_flow
    df_doe4.loc[i, 'CP: Dil CH4'] = True
    df_doe4.loc[i, 'CP: Set No'] = 4

In [65]:
df_doe4

Unnamed: 0,ID,datetime,Annealing H2 (sccm),Growth H2 (sccm),Growth CH4 (sccm),Growth He (sccm),Cooling H2 (sccm),Cooling CH4 (sccm),Cooling He (sccm),Growth Time (min),Dew Point (C),Temperature (C),Relative Humidity (pct),Res: Graphene Presence,CP: Total Flow Rate (sccm),CP: CH4/Total,CP: CH4/H2,CP: Dil CH4,CP: Set No
0,20200921_1,2020-09-21 17:00:00,25,25,0.01716,476.69884,0,0.0,475.0,5.0,7.1,22.5,37.040835,No,501.716,3.4e-05,0.000686,True,4
1,20200921_2,2020-09-21 20:20:00,25,25,0.01716,476.69884,25,0.01716,476.69884,5.0,7.98,23.0,38.158064,No,501.716,3.4e-05,0.000686,True,4
2,20200922_1,2020-09-22 00:50:00,50,50,0.03432,953.39768,50,0.03432,953.39768,5.0,8.76,22.5,41.467763,Yes,1003.432,3.4e-05,0.000686,True,4
3,20200922_2,2020-09-22 10:50:00,50,50,0.03432,953.39768,50,0.03432,953.39768,5.0,11.38,22.5,49.40754,Yes,1003.432,3.4e-05,0.000686,True,4
4,20200922_3,2020-09-22 14:25:00,25,25,0.01716,476.69884,0,0.0,475.0,5.0,11.24,23.0,47.489815,No,501.716,3.4e-05,0.000686,True,4
5,20200922_4,2020-09-22 20:30:00,25,25,0.01716,476.69884,25,0.01716,476.69884,5.0,10.82,23.3,45.354451,No,501.716,3.4e-05,0.000686,True,4
6,20200923_2,2020-09-23 21:45:00,25,25,0.01716,476.69884,0,0.0,475.0,7.5,9.92,22.9,43.757547,No,501.716,3.4e-05,0.000686,True,4
7,20200924_1,2020-09-24 00:45:00,50,50,0.03432,953.39768,0,0.0,950.0,10.0,10.34,23.0,44.731545,Yes,1003.432,3.4e-05,0.000686,True,4
8,20200924_3,2020-09-24 07:00:00,50,50,0.03432,953.39768,50,0.03432,953.39768,7.5,11.4,23.0,47.995561,Yes,1003.432,3.4e-05,0.000686,True,4
9,20200924_4,2020-09-24 11:00:00,50,50,0.03432,953.39768,50,0.03432,953.39768,10.0,11.6,23.2,48.049708,No,1003.432,3.4e-05,0.000686,True,4


# Concatenate DataFrames

In [37]:
#df = df_doe1.append([])
# Stack the four standardized tables into one frame and renumber the rows 0..n-1.
df = pd.concat([df_doe1,df_doe2,df_doe3,df_doe4], ignore_index=True)

In [38]:
# df.to_csv('DoE_Data_1_4.csv')

# Create a new CSV with only DoE Sets 4 and 5

In [39]:
# Reload the combined Sets 1-4 table from disk; the first CSV column is the row index.
# NOTE(review): this replaces the in-memory `df` built by the concat cell - confirm
# that ../data/DoE_Data_1_4.csv is the intended, up-to-date export.
df = pd.read_csv("../data/DoE_Data_1_4.csv", index_col=0)
# Drop every row that has a missing value in ANY column (this includes, but is
# not limited to, rows without a %RH value)
df = df.dropna()
# Keep only the experiments with Set No > 3 (Set 4 onward)
df4 = df.loc[(df["CP: Set No"]>3)]
# Renumber the remaining rows 0..n-1
df4 = df4.reset_index(drop=True)

df4

Unnamed: 0,ID,datetime,Annealing H2 (sccm),Growth H2 (sccm),Growth CH4 (sccm),Growth He (sccm),Cooling H2 (sccm),Cooling CH4 (sccm),Cooling He (sccm),Growth Time (min),Dew Point (C),Temperature (C),Relative Humidity (pct),Res: Graphene Presence,CP: Total Flow Rate (sccm),CP: CH4/Total,CP: CH4/H2,CP: Dil CH4,CP: Set No,Res: pct. Coverage
0,20200921_1,09/21/20 17:00,25,25,0.01716,476.69884,0,0.0,475.0,5.0,7.1,22.5,37.040835,No,501.716,3.4e-05,0.000686,True,4,0.0
1,20200921_2,09/21/20 20:20,25,25,0.01716,476.69884,25,0.01716,476.69884,5.0,7.98,23.0,38.158064,No,501.716,3.4e-05,0.000686,True,4,0.0
2,20200922_1,09/22/20 0:50,50,50,0.03432,953.39768,50,0.03432,953.39768,5.0,8.76,22.5,41.467763,Yes,1003.432,3.4e-05,0.000686,True,4,0.108187
3,20200922_2,09/22/20 10:50,50,50,0.03432,953.39768,50,0.03432,953.39768,5.0,11.38,22.5,49.40754,Yes,1003.432,3.4e-05,0.000686,True,4,0.134163
4,20200922_3,09/22/20 14:25,25,25,0.01716,476.69884,0,0.0,475.0,5.0,11.24,23.0,47.489815,No,501.716,3.4e-05,0.000686,True,4,0.0
5,20200922_4,09/22/20 20:30,25,25,0.01716,476.69884,25,0.01716,476.69884,5.0,10.82,23.3,45.354451,No,501.716,3.4e-05,0.000686,True,4,0.0
6,20200923_2,09/23/20 21:45,25,25,0.01716,476.69884,0,0.0,475.0,7.5,9.92,22.9,43.757547,No,501.716,3.4e-05,0.000686,True,4,0.0
7,20200924_1,09/24/20 0:45,50,50,0.03432,953.39768,0,0.0,950.0,10.0,10.34,23.0,44.731545,Yes,1003.432,3.4e-05,0.000686,True,4,0.126065
8,20200924_3,09/24/20 7:00,50,50,0.03432,953.39768,50,0.03432,953.39768,7.5,11.4,23.0,47.995561,Yes,1003.432,3.4e-05,0.000686,True,4,0.054047
9,20200924_4,09/24/20 11:00,50,50,0.03432,953.39768,50,0.03432,953.39768,10.0,11.6,23.2,48.049708,No,1003.432,3.4e-05,0.000686,True,4,0.0


In [40]:
# Constants:

# Multiplier applied to the CH4 'K' digit parsed from 'Gas Flow Rates (He:CH4:H2)'
# when the Set 5 table is filled.
# NOTE(review): presumably a flow-controller calibration factor - confirm its origin and units.
k_doe5 = 1.716

In [47]:
# Load the raw Set 5 sheet; no header= offset is given, so the first line supplies the column names.
doe5 = pd.read_csv('Set 5.csv')

In [49]:
# Keep all rows and the thirteen columns at positions 1-13; column 0 and anything from position 14 on are dropped.
doe5 = doe5.iloc[:, 1:14]

In [50]:
doe5

Unnamed: 0,Total Gas Flow Rate (sccm),Growth Duration (min),Cooling Type,Gas Flow Rates (He:CH4:H2),Polishing Data,Name,Sample Name,Time of Experiment,SEM,Temperature,Dew Point,Relative Humidity,Graphene Presence
0,500,7,GC,475 : 7K : 18,20210413_1,MS,20210413_1,10:50 PM,JY,21.5,1.94,27.448279,Yes
1,500,7,GC,475 : 5K : 20,20210415_1,MS,20210415_1,3:50 PM,JY,21.5,1.44,26.48406,Yes
2,500,10,GC,475 : 7K : 18,20210420_11,JY,20210420_1,10:45 AM,JY,21.2,1.06,26.249608,Yes
3,500,10,GC,475 : 5K : 20,20210421_1,JY,20210421_1,10:00 AM,JY,21.5,1.02,25.697431,Yes
4,500,10,GC,475 : 5K : 20,20210421_1,JY,20210421_2,1:00 PM,JY,22.0,-1.6,20.60192,Yes
5,500,10,GC,475 : 7K : 18,20210421_1,MS,20210421_3,6:45 PM,MS,21.5,-0.14,23.631306,Yes
6,500,10,GC,475 : 7K : 18,20210421_2,MS,20210421_4,9:45 PM,MS,22.0,1.16,25.176369,Yes
7,500,10,GC,475 : 5K : 20,20210423_1,JY,20210423_1,9:00 AM,MS,21.5,0.7,25.112063,Yes
8,500,7,GC,475 : 7K : 18,20210424_1,JY,20210424_1,10:00 AM,MS,21.2,6.36,38.113688,Yes
9,500,10,GC,475 : 7K : 18,20210508_2,AS,20210508_1,10:30 PM,AS,21.5,6.4,37.522615,Yes


In [52]:
# Pre-allocate the standardized Set 5 table: rows 0-15 and the shared column schema.
# No data is passed, so every cell starts out as NaN.
df_doe5 = pd.DataFrame(index=range(16), 
                       columns = df_columns)

In [55]:
# Fill the standardized Set 5 table row by row from the raw sheet.
# Cells are written with df_doe5.loc[row, column]. The earlier
# df_doe5[column][row] = value form is chained assignment, which pandas does not
# guarantee to write through to the frame (with Copy-on-Write it never does),
# and this notebook silences the warning that would report it.
for i in range(16):  # one iteration per pre-allocated row of df_doe5
    sample_name = doe5['Sample Name'][i]
    flow_spec = doe5['Gas Flow Rates (He:CH4:H2)'][i]
    cooling_type = doe5['Cooling Type'][i]
    dew_point = doe5['Dew Point'][i]
    temperature = doe5['Temperature'][i]

    # Parse the 'He : CH4 : H2' string (e.g. '475 : 7K : 18') by fixed position.
    # NOTE(review): this only works for a 3-digit He value, a single-digit CH4
    # 'K' value at index 6 and a 2-digit H2 value - confirm every row fits.
    he_setpoint = int(flow_spec[:3])
    ch4_k = int(flow_spec[6])
    h2_flow = int(flow_spec[-2:])

    # The scaled CH4-line value (ch4_k*k_doe5) is split 1 % to CH4 and 99 % to He.
    # NOTE(review): presumably a 1 % CH4-in-He mixture - confirm.
    ch4_flow = ch4_k*k_doe5*0.01
    he_flow = he_setpoint+ch4_k*k_doe5*0.99
    growth_total = ch4_flow+h2_flow+he_flow

    df_doe5.loc[i, 'ID'] = sample_name
    # Date part of the sample name (last two characters removed) plus the recorded clock time.
    df_doe5.loc[i, 'datetime'] = pd.to_datetime(sample_name[:-2]+' '+doe5['Time of Experiment'][i])

    df_doe5.loc[i, 'Annealing H2 (sccm)'] = h2_flow

    df_doe5.loc[i, 'Growth H2 (sccm)'] = h2_flow
    df_doe5.loc[i, 'Growth CH4 (sccm)'] = ch4_flow
    df_doe5.loc[i, 'Growth He (sccm)'] = he_flow

    # 'NC' rows cool under the He set-point only; 'GC' rows cool under the same
    # three flows as growth. Any other cooling type leaves the cooling columns NaN.
    if cooling_type == 'NC':
        df_doe5.loc[i, 'Cooling H2 (sccm)'] = 0
        df_doe5.loc[i, 'Cooling CH4 (sccm)'] = 0
        df_doe5.loc[i, 'Cooling He (sccm)'] = he_setpoint
    elif cooling_type == 'GC':
        df_doe5.loc[i, 'Cooling H2 (sccm)'] = h2_flow
        df_doe5.loc[i, 'Cooling CH4 (sccm)'] = ch4_flow
        df_doe5.loc[i, 'Cooling He (sccm)'] = he_flow

    df_doe5.loc[i, 'Growth Time (min)'] = doe5['Growth Duration (min)'][i]

    df_doe5.loc[i, 'Dew Point (C)'] = dew_point
    df_doe5.loc[i, 'Temperature (C)'] = temperature
    # Recomputed from dew point and temperature rather than copied from the sheet.
    df_doe5.loc[i, 'Relative Humidity (pct)'] = rh(dew_point, temperature)

    df_doe5.loc[i, 'Res: Graphene Presence'] = doe5['Graphene Presence'][i]

    df_doe5.loc[i, 'CP: Total Flow Rate (sccm)'] = growth_total
    df_doe5.loc[i, 'CP: CH4/Total'] = ch4_flow/growth_total
    df_doe5.loc[i, 'CP: CH4/H2'] = ch4_flow/h2_flow
    df_doe5.loc[i, 'CP: Dil CH4'] = True
    df_doe5.loc[i, 'CP: Set No'] = 5

In [56]:
df_doe5

Unnamed: 0,ID,datetime,Annealing H2 (sccm),Growth H2 (sccm),Growth CH4 (sccm),Growth He (sccm),Cooling H2 (sccm),Cooling CH4 (sccm),Cooling He (sccm),Growth Time (min),Dew Point (C),Temperature (C),Relative Humidity (pct),Res: Graphene Presence,CP: Total Flow Rate (sccm),CP: CH4/Total,CP: CH4/H2,CP: Dil CH4,CP: Set No
0,20210413_1,2021-04-13 22:50:00,18,18,0.12012,486.89188,18,0.12012,486.89188,7,1.94,21.5,27.448279,Yes,505.012,0.000238,0.006673,True,5
1,20210415_1,2021-04-15 15:50:00,20,20,0.0858,483.4942,20,0.0858,483.4942,7,1.44,21.5,26.48406,Yes,503.58,0.00017,0.00429,True,5
2,20210420_1,2021-04-20 10:45:00,18,18,0.12012,486.89188,18,0.12012,486.89188,10,1.06,21.2,26.249608,Yes,505.012,0.000238,0.006673,True,5
3,20210421_1,2021-04-21 10:00:00,20,20,0.0858,483.4942,20,0.0858,483.4942,10,1.02,21.5,25.697431,Yes,503.58,0.00017,0.00429,True,5
4,20210421_2,2021-04-21 13:00:00,20,20,0.0858,483.4942,20,0.0858,483.4942,10,-1.6,22.0,20.60192,Yes,503.58,0.00017,0.00429,True,5
5,20210421_3,2021-04-21 18:45:00,18,18,0.12012,486.89188,18,0.12012,486.89188,10,-0.14,21.5,23.631306,Yes,505.012,0.000238,0.006673,True,5
6,20210421_4,2021-04-21 21:45:00,18,18,0.12012,486.89188,18,0.12012,486.89188,10,1.16,22.0,25.176369,Yes,505.012,0.000238,0.006673,True,5
7,20210423_1,2021-04-23 09:00:00,20,20,0.0858,483.4942,20,0.0858,483.4942,10,0.7,21.5,25.112063,Yes,503.58,0.00017,0.00429,True,5
8,20210424_1,2021-04-24 10:00:00,18,18,0.12012,486.89188,18,0.12012,486.89188,7,6.36,21.2,38.113688,Yes,505.012,0.000238,0.006673,True,5
9,20210508_1,2021-05-08 22:30:00,18,18,0.12012,486.89188,18,0.12012,486.89188,10,6.4,21.5,37.522615,Yes,505.012,0.000238,0.006673,True,5


In [66]:
#df = df_doe1.append([])
# Append the Set 5 rows to the Set 4 rows reloaded from CSV and renumber the rows 0..n-1.
# NOTE(review): df4 was read from a CSV without date parsing, so its 'datetime'
# values are strings and it carries a 'Res: pct. Coverage' column; df_doe5 holds
# Timestamps and has no coverage column (it becomes NaN for the Set 5 rows).
# Confirm the mixed datetime formats are acceptable to whatever reads the result.
df45 = pd.concat([df4,df_doe5], ignore_index=True)

In [69]:
# Write the combined Set 4 + Set 5 table to the working directory; the row index
# is written as the first (unnamed) column.
df45.to_csv('DoE_Data_4_5.csv')