In [110]:
import Pkg; Pkg.activate("..")

[32m[1m  Activating[22m[39m project at `~/SAFT_ML`


In [111]:
using CSV, DataFrames, DelimitedFiles, Clapeyron, PyCall
import PyPlot; const plt = PyPlot ;

In [112]:
# Open and structure the Esper et al. statistics data.
# A cell that holds only "-" marks a missing value; it is replaced by the sentinel -1
# for easier processing (all valid values are positive).

raw_data_statistics = CSV.read("Esper et al Statistics (CSV).csv",DataFrame,header=1) 
# NOTE(review): the 1:1842 x 1:15 window is hard-coded; presumably it trims unused
# trailing rows/columns of the CSV export — confirm against the file.
processed_data_statistics = raw_data_statistics[1:1842,1:15]

# Text columns whose entries are wrapped in parentheses in the CSV.
parenthesised_columns = [
    :p_sat_AAD_outliers, :rho_vap_AAD_outliers,
    :p_sat_n_points_outliers, :rho_vap_n_points_outliers,
]
# Text columns that may contain the "-" placeholder, grouped by their numeric target type.
float_text_columns = [
    :p_sat_AAD_outliers, :rho_liq_sat_AAD, :rho_liq_sp_AAD, :rho_vap_AAD_outliers,
]
int_text_columns = [
    :p_sat_n_points_outliers, :rho_liq_sat_n_points,
    :rho_liq_sp_n_points, :rho_vap_n_points_outliers,
]

# Only a cell that is exactly "-" (ignoring surrounding whitespace) becomes "-1".
# Replacing every hyphen would silently corrupt values such as "1e-5" (-> "1e-15").
placeholder_to_sentinel = text -> strip(text) == "-" ? "-1" : text

for col in parenthesised_columns
    processed_data_statistics[!, col] =
        map(text -> replace(text, r"[()]" => ""), processed_data_statistics[!, col])
end

processed_data_statistics.Name = String.(processed_data_statistics.Name)
processed_data_statistics.CAS = String15.(processed_data_statistics.CAS)

# Columns that CSV.read already parsed as numbers only need their element type fixed.
for col in (:molarweight, :p_sat_AAD, :rho_liq_AAD)
    processed_data_statistics[!, col] = Float64.(processed_data_statistics[!, col])
end
for col in (:p_sat_n_points, :rho_liq_n_points)
    processed_data_statistics[!, col] = Int64.(processed_data_statistics[!, col])
end

# Text columns: substitute the placeholder, then parse to the numeric type.
for col in float_text_columns
    cleaned = map(placeholder_to_sentinel, processed_data_statistics[!, col])
    processed_data_statistics[!, col] = parse.(Float64, cleaned)
end
for col in int_text_columns
    cleaned = map(placeholder_to_sentinel, processed_data_statistics[!, col])
    processed_data_statistics[!, col] = parse.(Int64, cleaned)
end

processed_data_statistics ;

[33m[1m└ [22m[39m[90m@ CSV ~/.julia/packages/CSV/OnldF/src/file.jl:577[39m


In [113]:
# Load the Esper et al. SAFT parameter table, dump its column names to a text file for
# reference, and order the rows by molar weight.
raw_data_parameters = CSV.read("SI_pcp-saft_parameters.csv",DataFrame,header=1) ;
writedlm("out.txt", names(raw_data_parameters), ' ') ;

# A missing entry in these three parameter columns is stored as 0, and the columns are
# made plain Float64.
for col in (:mu, :kappa_ab, :epsilon_k_ab)
    raw_data_parameters[!, col] = Float64.(coalesce.(raw_data_parameters[!, col], 0))
end

raw_data_parameters = sort(raw_data_parameters, :molarweight) ;

In [114]:
# Allocate `processed_data` as an all-`missing` placeholder table with one row per record
# of `raw_data_parameters`. The row count must come from `raw_data_parameters` (no
# `raw_data` table is defined in this notebook), because the columns are later replaced
# by same-length vectors taken from that table.
num_rows = nrow(raw_data_parameters)

# Column order is significant: it defines the layout of `processed_data`.
processed_data_columns = [
    :species, :CAS, :isomeric_SMILES, :family, :Mw,
    :segment, :sigma, :epsilon, :dipole, :kappa_ab, :epsilon_k_ab,
    :na, :nb, :interaction, :bounds_violation, :source,
]

# `fill` is called once per column so that no two columns share a vector.
processed_data = DataFrame(
    [name => fill(missing, num_rows) for name in processed_data_columns]
) ;

In [115]:
# Fill `processed_data` from the parameter table under the notebook's own column names.
# Each column is copied (`[:, src]`) instead of shared: the `filter!` below deletes rows
# in place, and a shared vector would also be shortened inside `raw_data_parameters`,
# leaving that table with columns of different lengths.
column_sources = [
    :species => :common_name,
    :CAS => :cas,
    :Mw => :molarweight,
    :isomeric_SMILES => :isomeric_smiles,
    :family => :family,
    :segment => :m,
    :sigma => :sigma,
    :epsilon => :epsilon_k,
    :dipole => :mu,
    :kappa_ab => :kappa_ab,
    :epsilon_k_ab => :epsilon_k_ab,
    :na => :na,
    :nb => :nb,
    :interaction => :opt,
    :bounds_violation => :bounds_violation,
]
for (target, origin) in column_sources
    processed_data[!, target] = raw_data_parameters[:, origin]
end
processed_data[!, :source] .= "10.1021/acs.iecr.3c02255" ;

# Species dropped from the data set.
# NOTE(review): the reason for excluding these three is not recorded here — confirm.
excluded_species = ("cis-2-butene", "(cis/trans)-2-butene", "cis-2-pentene")
filter!(row -> row.species ∉ excluded_species, processed_data)

# Taken after filtering (and copied) so the list names exactly the rows that remain;
# the generation cell looks every entry up in `processed_data.species`.
species_names = copy(processed_data.species) ;

# processed_data


In [122]:
# Build the `training_data` skeleton: identification columns taken from `processed_data`,
# followed by zero-initialised result columns. The column order is relied upon by
# positional indexing elsewhere in the notebook, so it must not change.
num_rows = nrow(processed_data)
training_data = DataFrame()

# Identification / bookkeeping columns (the vectors are shared with `processed_data`).
for name in (:species, :CAS, :isomeric_SMILES, :family, :Mw, :interaction, :source)
    training_data[!, name] = processed_data[!, name]
end

# Scalar critical properties, one Float64 per species.
for name in (:critical_temperature_K, :critical_pressure_MPa, :critical_volume_m3_per_mol)
    training_data[!, name] = zeros(Float64, num_rows)
end

# Saturation curves, one Vector{Float64} per species (placeholder `[0.0]`).
for name in (:sat_temperatures_K, :sat_pressures_MPa,
             :sat_volumes_liq_m3_per_mol, :sat_volumes_vap_m3_per_mol)
    training_data[!, name] = fill([0.0], num_rows)
end

# Deviation statistics (Float64).
for name in (:p_sat_AAD, :p_sat_AAD_outliers, :rho_liq_AAD,
             :rho_liq_sat_AAD, :rho_liq_sp_AAD, :rho_vap_AAD_outliers)
    training_data[!, name] = fill(0.0, num_rows)
end

# Data-point counts (Int).
for name in (:p_sat_n_points, :p_sat_n_points_outliers, :rho_liq_n_points,
             :rho_liq_sat_n_points, :rho_liq_sp_n_points, :rho_vap_n_points_outliers)
    training_data[!, name] = fill(0, num_rows)
end

In [123]:
# Check the number of functional groups in the dataset and the number of species per
# functional group.
unique_values = unique(processed_data[!, :family])
num_unique_values = length(unique_values)

# One row per distinct family with the number of rows of `processed_data` carrying it.
dataset_summary = DataFrame(
    functional_group = unique_values,
    occurances = Int[count(==(group), processed_data.family) for group in unique_values]
)

# dataset_summary

In [124]:
# This cell generates data for all ~1800 species in Esper et al.
# For every entry of `species_names` a PPCSAFT model is built, its critical point is
# computed, and the saturation curve is sampled at `n` temperatures between 0.5*Tc and Tc.
# NOTE(review): the values are stored exactly as returned by `crit_pure` /
# `saturation_pressure`, with no unit conversion, although the target columns are named
# `..._MPa`; the stored magnitudes (e.g. 4.68922e6 for methane) suggest Pa — confirm.
num_rows = nrow(processed_data)

n = 500

# Target columns for the entries of the critical-point result, addressed by name so the
# values cannot land in the wrong column if the table layout changes.
critical_columns = (
    :critical_temperature_K, :critical_pressure_MPa, :critical_volume_m3_per_mol,
)

for species in species_names

    row_number = findfirst(isequal(species), processed_data.species)
    isnothing(row_number) && error("Species $(species) not found in processed_data")
    println(row_number," ",species)

    model = PPCSAFT(species) ;
    critical_props = crit_pure(model)
    critical_temperature = critical_props[1]

    temp_range = collect(range(0.5*critical_temperature,critical_temperature,n)) ;
    sat_props = [saturation_pressure(model,temperature) for temperature in temp_range] ;

    # Each saturation result is indexed as (pressure, liquid volume, vapour volume).
    sat_pressures = [point[1] for point in sat_props] ;
    sat_vols_liq = [point[2] for point in sat_props] ;
    sat_vols_vap = [point[3] for point in sat_props] ;

    for (column, value) in zip(critical_columns, critical_props)
        training_data[row_number, column] = value
    end

    training_data[row_number,:sat_temperatures_K] = temp_range
    training_data[row_number,:sat_pressures_MPa] = sat_pressures
    training_data[row_number,:sat_volumes_liq_m3_per_mol] = sat_vols_liq
    training_data[row_number,:sat_volumes_vap_m3_per_mol] = sat_vols_vap

end


1 methane
2 ammonia
3 ammonia-d3
4 water
5 tritium oxide
6 hydrogen fluoride
7 ethyne
8 hydrogen cyanide
9 carbon monoxide
10 nitrogen
11 ethylene
12 ethylene-d4
13 nitrogen oxide
14 formaldehyde
15 ethane
16 methylamine
17 oxygen
18 silane
19 methanol
20 o-deuteromethanol
21 hydrazine
22 hydrogen sulfide
23 deuterium sulfide
24 phosphorous trihydride
25 hydrogen peroxide
26 methyl fluoride
27 hydrogen chloride
28 fluorine
29 argon
30 propyne
31 propadiene
32 acetonitrile
33 propylene
34 cyclopropane
35 ethylenimine
36 carbon dioxide
37 dinitrogen monoxide
38 acetaldehyde
39 ethylene oxide
40 propane
41 formamide
42 dimethylamine
43 ethylamine
44 nitrogen dioxide
45 formic acid
46 ethanol
47 dimethyl ether
48 methylhydrazine
49 ozone
50 methanethiol
51 fluoroethane
52 methyl chloride
53 cyanogen
54 difluoromethane
55 1-buten-3-yne
56 acrylonitrile
57 1,3-butadiene
58 2-butyne
59 1-butyne
60 propionitrile
61 acrolein
62 2-propyn-1-ol
63 1-butene
64 trans-2-butene
65 isobutylene
66 cyclo

In [125]:
# # All phase envelopes plot
# colour_grad_1 = collect(range(1,194,length(species_names)) ./255) 
# colour_grad_2 = collect(range(194,1,length(species_names)) ./255)

# plt.figure(figsize=(8, 6), dpi=400)

# for i = 1:length(species_names)

# plt.semilogx(1e-3 ./training_data[i,12],training_data[i,10], color = [colour_grad_1[i] 0 colour_grad_2[i]])
# plt.semilogx(1e-3 ./training_data[i,13],training_data[i,10],color = [colour_grad_1[i] 0 colour_grad_2[i]])

# end

# # plt.legend(loc="lower right",bbox_to_anchor =(-0.1,-0.05),frameon=false,fontsize=8,ncol=3) 
# plt.xlabel("Density / (mol/L)",fontsize=12)
# plt.ylabel("Temperature / K",fontsize=12)

# plt.savefig("all_compound_phase_envelopes.png",dpi=400)


In [130]:
# Add statistics to training data dataframe.
# Every row of `training_data` is matched by CAS number to the first row of
# `processed_data_statistics` with the same CAS, and the statistics columns are copied.
statistics_columns = [
    :p_sat_AAD, :p_sat_AAD_outliers, :rho_liq_AAD,
    :rho_liq_sat_AAD, :rho_liq_sp_AAD, :rho_vap_AAD_outliers,
    :p_sat_n_points, :p_sat_n_points_outliers, :rho_liq_n_points,
    :rho_liq_sat_n_points, :rho_liq_sp_n_points, :rho_vap_n_points_outliers,
]

for i = 1:nrow(training_data)

    cas_lookup = training_data[i,:CAS]
    # `isequal` gives a plain Bool even if a CAS entry is `missing`.
    statistics_row = findfirst(isequal(cas_lookup), processed_data_statistics.CAS)

    # Fail with a readable message instead of an indexing error on `nothing`.
    if isnothing(statistics_row)
        error("No statistics entry for CAS $(cas_lookup) (training_data row $(i))")
    end

    for col in statistics_columns
        training_data[i, col] = processed_data_statistics[statistics_row, col]
    end

end


In [127]:
# Data storage
# Writes the full `training_data` table to "training_data.csv" (path relative to the
# current working directory). The reload cell below reads the four saturation-curve
# columns back as bracketed, comma-separated text and parses them into Float64 vectors.
CSV.write("training_data.csv", training_data) ;

In [129]:
# Reload the stored table and turn the saturation-curve columns, which come back from the
# CSV as text of the form "[a, b, c]", into Vector{Float64} columns again.
training_data = CSV.read("training_data.csv",DataFrame)
num_rows = nrow(training_data)

# Final (parsed) column names and the temporary names given to their text versions.
array_cols_to_create = [:sat_temperatures_K, :sat_pressures_MPa, :sat_volumes_liq_m3_per_mol, :sat_volumes_vap_m3_per_mol]
string_columns = [:sat_temp_strings, :sat_pressure_strings, :sat_vol_liq_strings, :sat_vol_vap_strings]

# Move the text columns out of the way so the original names are free for the parsed data.
rename!(training_data, array_cols_to_create .=> string_columns)

# Strip the square brackets, split on commas and parse every entry; the parsed columns are
# appended at the end of the table in the order of `array_cols_to_create`.
for (col, str_col) in zip(array_cols_to_create, string_columns)
    training_data[!, col] = Vector{Float64}[
        parse.(Float64, split(replace(text, r"[][]" => ""), ","))
        for text in training_data[!, str_col]
    ]
end

# Remove the string columns
select!(training_data, Not(string_columns...)) ;

training_data

Row,species,CAS,isomeric_SMILES,family,Mw,interaction,source,critical_temperature_K,critical_pressure_MPa,critical_volume_m3_per_mol,p_sat_AAD,p_sat_AAD_outliers,rho_liq_AAD,rho_liq_sat_AAD,rho_liq_sp_AAD,rho_vap_AAD_outliers,p_sat_n_points,p_sat_n_points_outliers,rho_liq_n_points,rho_liq_sat_n_points,rho_liq_sp_n_points,rho_vap_n_points_outliers,sat_temperatures_K,sat_pressures_MPa,sat_volumes_liq_m3_per_mol,sat_volumes_vap_m3_per_mol
Unnamed: 0_level_1,String,String15,String,String31,Float64,String15,String31,Float64,Float64,Float64,Float64,Float64,Float64,Float64,Float64,Float64,Int64,Int64,Int64,Int64,Int64,Int64,Array…,Array…,Array…,Array…
1,methane,74-82-8,C,Alkanes,16.031,NONPOLAR,10.1021/acs.iecr.3c02255,191.453,4.68922e6,0.000108063,0.59,0.72,0.53,0.48,0.68,2.65,1211,1222,1126,856,270,4317,"[95.7267, 95.9186, 96.1104, 96.3023, 96.4941, 96.6859, 96.8778, 97.0696, 97.2614, 97.4533 … 189.727, 189.919, 190.111, 190.302, 190.494, 190.686, 190.878, 191.07, 191.262, 191.453]","[21706.6, 22184.2, 22670.1, 23164.7, 23667.8, 24179.7, 24700.4, 25230.1, 25768.8, 26316.7 … 4.46102e6, 4.48608e6, 4.51122e6, 4.53643e6, 4.56172e6, 4.58707e6, 4.6125e6, 4.63801e6, 4.66358e6, 4.68922e6]","[3.60443e-5, 3.60648e-5, 3.60854e-5, 3.61059e-5, 3.61265e-5, 3.61471e-5, 3.61678e-5, 3.61885e-5, 3.62092e-5, 3.62299e-5 … 8.20978e-5, 8.33085e-5, 8.46313e-5, 8.60919e-5, 8.77271e-5, 8.95939e-5, 9.17882e-5, 9.44977e-5, 9.82083e-5, 0.000108063]","[0.036283, 0.0355668, 0.0348676, 0.0341852, 0.0335189, 0.0328684, 0.0322333, 0.031613, 0.0310073, 0.0304156 … 0.00014731, 0.000144572, 0.000141735, 0.000138772, 0.000135648, 0.000132305, 0.000128648, 0.000124489, 0.000119342, 0.000108063]"
2,ammonia,7664-41-7,N,Inorganic compounds,17.027,ASSOCIATIVE,10.1021/acs.iecr.3c02255,423.884,1.50571e7,7.2694e-5,1.23,1.4,1.42,1.38,1.7,10.78,1082,1093,879,775,104,180,"[211.942, 212.367, 212.792, 213.216, 213.641, 214.066, 214.491, 214.915, 215.34, 215.765 … 420.062, 420.486, 420.911, 421.336, 421.761, 422.185, 422.61, 423.035, 423.46, 423.884]","[19918.2, 20497.6, 21091.0, 21698.6, 22320.8, 22957.8, 23609.9, 24277.4, 24960.5, 25659.5 … 1.4172e7, 1.42682e7, 1.43649e7, 1.44622e7, 1.456e7, 1.46583e7, 1.47572e7, 1.48566e7, 1.49566e7, 1.50571e7]","[2.43847e-5, 2.44004e-5, 2.44161e-5, 2.44319e-5, 2.44477e-5, 2.44635e-5, 2.44794e-5, 2.44952e-5, 2.45111e-5, 2.4527e-5 … 5.57947e-5, 5.65501e-5, 5.73779e-5, 5.82953e-5, 5.9327e-5, 6.05115e-5, 6.19137e-5, 6.36609e-5, 6.60837e-5, 7.2694e-5]","[0.0881662, 0.0858388, 0.0835837, 0.0813982, 0.07928, 0.0772267, 0.075236, 0.0733058, 0.0714339, 0.0696184 … 0.000101229, 9.91459e-5, 9.69995e-5, 9.47723e-5, 9.24394e-5, 8.99624e-5, 8.72763e-5, 8.42535e-5, 8.05634e-5, 7.2694e-5]"
3,ammonia-d3,13550-49-7,[2H]N([2H])[2H],Other compounds,17.027,ASSOCIATIVE,10.1021/acs.iecr.3c02255,419.98,1.47831e7,6.85203e-5,0.27,0.31,0.09,0.13,0.04,-1.0,231,232,20,12,8,-1,"[209.99, 210.411, 210.832, 211.253, 211.673, 212.094, 212.515, 212.936, 213.357, 213.777 … 416.193, 416.614, 417.034, 417.455, 417.876, 418.297, 418.718, 419.138, 419.559, 419.98]","[14942.5, 15384.8, 15838.2, 16302.8, 16778.9, 17266.7, 17766.5, 18278.4, 18802.7, 19339.6 … 1.39215e7, 1.40154e7, 1.41099e7, 1.42047e7, 1.43e7, 1.43957e7, 1.44919e7, 1.45885e7, 1.46856e7, 1.47831e7]","[1.9988e-5, 2.00015e-5, 2.00151e-5, 2.00286e-5, 2.00422e-5, 2.00558e-5, 2.00695e-5, 2.00831e-5, 2.00968e-5, 2.01105e-5 … 5.25051e-5, 5.32469e-5, 5.40563e-5, 5.49491e-5, 5.59483e-5, 5.70892e-5, 5.84318e-5, 6.00934e-5, 6.23784e-5, 6.85203e-5]","[0.11499, 0.111879, 0.108866, 0.105947, 0.103118, 0.100377, 0.0977211, 0.0951465, 0.0926506, 0.0902308 … 9.4244e-5, 9.23853e-5, 9.04688e-5, 8.84785e-5, 8.63914e-5, 8.4172e-5, 8.17604e-5, 7.90392e-5, 7.57036e-5, 6.85203e-5]"
4,water,7732-18-5,O,Inorganic compounds,18.011,ASSOCIATIVE,10.1021/acs.iecr.3c02255,677.938,3.02134e7,5.80502e-5,1.1,1.18,2.21,2.23,0.76,7.52,5870,5896,6342,6244,98,1827,"[338.969, 339.648, 340.327, 341.007, 341.686, 342.365, 343.045, 343.724, 344.403, 345.082 … 671.824, 672.503, 673.183, 673.862, 674.541, 675.22, 675.9, 676.579, 677.258, 677.938]","[25733.8, 26519.0, 27324.5, 28150.7, 28998.1, 29867.1, 30758.0, 31671.5, 32607.9, 33567.7 … 2.84252e7, 2.86202e7, 2.88161e7, 2.90129e7, 2.92107e7, 2.94093e7, 2.9609e7, 2.98095e7, 3.0011e7, 3.02134e7]","[1.81104e-5, 1.81216e-5, 1.81328e-5, 1.8144e-5, 1.81552e-5, 1.81664e-5, 1.81777e-5, 1.8189e-5, 1.82003e-5, 1.82116e-5 … 4.47011e-5, 4.53179e-5, 4.5991e-5, 4.67339e-5, 4.75657e-5, 4.85158e-5, 4.96343e-5, 5.10191e-5, 5.29245e-5, 5.80502e-5]","[0.108053, 0.105042, 0.102127, 0.0993058, 0.0965746, 0.0939302, 0.0913696, 0.0888898, 0.0864878, 0.084161 … 7.95434e-5, 7.79898e-5, 7.6388e-5, 7.47246e-5, 7.29804e-5, 7.11256e-5, 6.91103e-5, 6.68365e-5, 6.40496e-5, 5.80502e-5]"
5,tritium oxide,14940-65-9,[3H]O[3H],Other compounds,18.011,NONPOLAR,10.1021/acs.iecr.3c02255,706.752,3.89808e7,4.67452e-5,0.18,-1.0,0.79,0.79,-1.0,-1.0,7,-1,40,40,-1,-1,"[353.376, 354.084, 354.792, 355.5, 356.209, 356.917, 357.625, 358.333, 359.041, 359.749 … 700.378, 701.086, 701.795, 702.503, 703.211, 703.919, 704.627, 705.335, 706.044, 706.752]","[44165.7, 45487.5, 46842.3, 48230.8, 49653.7, 51111.5, 52605.0, 54134.8, 55701.7, 57306.2 … 3.66414e7, 3.68954e7, 3.71509e7, 3.74079e7, 3.76663e7, 3.79262e7, 3.81876e7, 3.84505e7, 3.87149e7, 3.89808e7]","[1.56883e-5, 1.56985e-5, 1.57087e-5, 1.57189e-5, 1.57291e-5, 1.57394e-5, 1.57496e-5, 1.57599e-5, 1.57702e-5, 1.57805e-5 … 3.59166e-5, 3.64002e-5, 3.69301e-5, 3.75174e-5, 3.81778e-5, 3.89362e-5, 3.9834e-5, 4.09529e-5, 4.25051e-5, 4.67452e-5]","[0.0663238, 0.0645207, 0.0627751, 0.0610849, 0.059448, 0.0578626, 0.0563268, 0.0548389, 0.0533971, 0.0519999 … 6.51626e-5, 6.38117e-5, 6.24207e-5, 6.09784e-5, 5.9469e-5, 5.78677e-5, 5.61328e-5, 5.41827e-5, 5.1805e-5, 4.67452e-5]"
6,hydrogen fluoride,7664-39-3,F,Inorganic compounds,20.006,DIPOLAR,10.1021/acs.iecr.3c02255,561.135,2.06211e7,6.78997e-5,4.81,5.44,8.36,8.41,8.23,22.26,277,279,97,73,24,360,"[280.567, 281.13, 281.692, 282.254, 282.816, 283.379, 283.941, 284.503, 285.065, 285.628 … 556.074, 556.637, 557.199, 557.761, 558.323, 558.886, 559.448, 560.01, 560.572, 561.135]","[63879.2, 65363.7, 66876.5, 68418.0, 69988.7, 71588.9, 73219.0, 74879.6, 76570.9, 78293.5 … 1.95217e7, 1.9642e7, 1.97627e7, 1.98839e7, 2.00056e7, 2.01278e7, 2.02504e7, 2.03735e7, 2.04971e7, 2.06211e7]","[2.13731e-5, 2.13859e-5, 2.13988e-5, 2.14117e-5, 2.14246e-5, 2.14376e-5, 2.14505e-5, 2.14635e-5, 2.14765e-5, 2.14895e-5 … 5.12082e-5, 5.19755e-5, 5.28143e-5, 5.37415e-5, 5.47809e-5, 5.59697e-5, 5.73704e-5, 5.91056e-5, 6.14929e-5, 6.78997e-5]","[0.036247, 0.0354898, 0.0347515, 0.0340314, 0.0333291, 0.0326441, 0.0319758, 0.0313239, 0.0306879, 0.0300672 … 9.42855e-5, 9.24064e-5, 9.04645e-5, 8.84431e-5, 8.6318e-5, 8.40522e-5, 8.15831e-5, 7.87881e-5, 7.53494e-5, 6.78997e-5]"
7,ethyne,74-86-2,C#C,Alkynes,26.016,NONPOLAR,10.1021/acs.iecr.3c02255,314.802,6.92998e6,0.000117565,0.82,1.64,1.0,0.34,1.22,-1.0,106,111,41,10,31,-1,"[157.401, 157.716, 158.032, 158.347, 158.663, 158.978, 159.293, 159.609, 159.924, 160.24 … 311.963, 312.278, 312.594, 312.909, 313.225, 313.54, 313.855, 314.171, 314.486, 314.802]","[11084.9, 11395.8, 11714.0, 12039.5, 12372.5, 12713.1, 13061.5, 13417.7, 13781.9, 14154.2 … 6.53342e6, 6.57657e6, 6.61995e6, 6.66355e6, 6.70738e6, 6.75144e6, 6.79573e6, 6.84025e6, 6.885e6, 6.92998e6]","[3.93553e-5, 3.93804e-5, 3.94056e-5, 3.94308e-5, 3.94561e-5, 3.94814e-5, 3.95067e-5, 3.9532e-5, 3.95574e-5, 3.95828e-5 … 9.00797e-5, 9.13107e-5, 9.26596e-5, 9.41544e-5, 9.58354e-5, 9.77649e-5, 0.000100048, 0.000102892, 0.000106833, 0.000117565]","[0.117585, 0.114595, 0.111695, 0.108882, 0.106152, 0.103504, 0.100933, 0.0984381, 0.0960161, 0.0936647 … 0.000163474, 0.000160144, 0.00015671, 0.000153143, 0.000149403, 0.000145427, 0.00014111, 0.000136244, 0.000130294, 0.000117565]"
8,hydrogen cyanide,74-90-8,C#N,Nitriles,27.011,DIPOLAR,10.1021/acs.iecr.3c02255,460.276,6.38909e6,0.000135455,4.43,4.49,1.2,1.23,0.63,-1.0,343,344,115,109,6,-1,"[230.138, 230.599, 231.06, 231.522, 231.983, 232.444, 232.905, 233.366, 233.828, 234.289 … 456.125, 456.587, 457.048, 457.509, 457.97, 458.431, 458.893, 459.354, 459.815, 460.276]","[2922.0, 3016.32, 3113.27, 3212.9, 3315.28, 3420.47, 3528.52, 3639.52, 3753.51, 3870.57 … 5.91889e6, 5.96934e6, 6.02023e6, 6.07155e6, 6.12331e6, 6.17553e6, 6.22821e6, 6.28136e6, 6.33498e6, 6.38909e6]","[3.6037e-5, 3.60602e-5, 3.60834e-5, 3.61066e-5, 3.61298e-5, 3.61531e-5, 3.61763e-5, 3.61996e-5, 3.6223e-5, 3.62463e-5 … 9.19905e-5, 9.37175e-5, 9.56356e-5, 9.77922e-5, 0.000100256, 0.000103135, 0.00010661, 0.000111039, 0.000117352, 0.000135455]","[0.653754, 0.634552, 0.615993, 0.598055, 0.580714, 0.563947, 0.547735, 0.532056, 0.516891, 0.502221 … 0.000221627, 0.000215107, 0.000208412, 0.000201494, 0.00019428, 0.000186662, 0.000178458, 0.000169306, 0.000158275, 0.000135455]"
9,carbon monoxide,630-08-0,[C-]#[O+],Inorganic compounds,27.995,NONPOLAR,10.1021/acs.iecr.3c02255,133.26,3.49266e6,0.000100479,1.97,2.45,0.55,0.5,0.63,0.38,220,227,144,88,56,9,"[66.6302, 66.7637, 66.8973, 67.0308, 67.1643, 67.2978, 67.4314, 67.5649, 67.6984, 67.832 … 132.059, 132.192, 132.326, 132.459, 132.593, 132.726, 132.86, 132.993, 133.127, 133.26]","[12160.5, 12448.8, 12742.6, 13042.0, 13347.1, 13658.0, 13974.7, 14297.3, 14625.9, 14960.6 … 3.31635e6, 3.33567e6, 3.35505e6, 3.37451e6, 3.39403e6, 3.41362e6, 3.43328e6, 3.45301e6, 3.4728e6, 3.49266e6]","[3.29573e-5, 3.2977e-5, 3.29967e-5, 3.30164e-5, 3.30362e-5, 3.3056e-5, 3.30758e-5, 3.30957e-5, 3.31156e-5, 3.31355e-5 … 7.6411e-5, 7.75205e-5, 7.87338e-5, 8.00747e-5, 8.15778e-5, 8.32965e-5, 8.53207e-5, 8.78265e-5, 9.12698e-5, 0.000100479]","[0.0451957, 0.044231, 0.043291, 0.0423751, 0.0414826, 0.0406127, 0.0397648, 0.0389382, 0.0381324, 0.0373467 … 0.000137801, 0.000135175, 0.000132456, 0.000129621, 0.000126634, 0.000123442, 0.000119956, 0.000116, 0.000111116, 0.000100479]"
10,nitrogen,7727-37-9,N#N,Elements,28.006,NONPOLAR,10.1021/acs.iecr.3c02255,126.413,3.38859e6,9.84356e-5,0.97,1.87,1.69,1.94,0.64,7.01,696,726,619,503,116,3467,"[63.2066, 63.3333, 63.46, 63.5866, 63.7133, 63.84, 63.9666, 64.0933, 64.22, 64.3466 … 125.273, 125.4, 125.527, 125.653, 125.78, 125.907, 126.033, 126.16, 126.287, 126.413]","[12716.3, 13012.2, 13313.7, 13620.7, 13933.5, 14252.1, 14576.5, 14906.9, 15243.3, 15585.8 … 3.21952e6, 3.23806e6, 3.25666e6, 3.27533e6, 3.29405e6, 3.31284e6, 3.33169e6, 3.3506e6, 3.36957e6, 3.38859e6]","[3.22924e-5, 3.23115e-5, 3.23306e-5, 3.23497e-5, 3.23689e-5, 3.23881e-5, 3.24073e-5, 3.24265e-5, 3.24458e-5, 3.24651e-5 … 7.484e-5, 7.59326e-5, 7.71268e-5, 7.8446e-5, 7.99241e-5, 8.1613e-5, 8.36007e-5, 8.60589e-5, 8.94329e-5, 9.84356e-5]","[0.0409757, 0.0401179, 0.0392818, 0.0384667, 0.0376721, 0.0368972, 0.0361416, 0.0354047, 0.0346859, 0.0339848 … 0.000134725, 0.000132178, 0.000129541, 0.000126789, 0.000123889, 0.00012079, 0.000117403, 0.000113556, 0.000108805, 9.84356e-5]"
