# Chickpea example

## Setup

In [6]:
import os
from mtml_model import mtmlModel
from dataset import Data, CVset
from pandas import read_csv
from optimisation import *
from semopy.efa import explore_cfa_model
from utils import *

# Input locations: one data directory (trailing slash kept) holding both tables
path_data = 'data_cicer/'
name_phens = 'data_phens.txt'
name_snps = 'snp_2579_renamed.txt'

# path_data already ends with a separator, so join() simply appends the name
file_phens = os.path.join(path_data, name_phens)
file_snps = os.path.join(path_data, name_snps)

# Prefix handed to model.add_snps() further down
snp_pref = 'Ca'


## Read data

In [3]:
# Phenotype table: tab-separated, first column used as the row index
phens_raw = read_csv(file_phens, sep='\t', index_col=0)

# Report the number of missing values per phenotype column
n_missing_per_trait = phens_raw.isna().sum(axis=0)
print(n_missing_per_trait)

# Keep only rows without any missing value ...
phens_complete = phens_raw.dropna(axis=0, how='any')
# ... and only columns that take more than two distinct values
has_enough_levels = phens_complete.nunique() > 2
data_phens = phens_complete.loc[:, has_enough_levels]

# SNP table: same file layout as the phenotype table
data_snps = read_csv(file_snps, sep='\t', index_col=0)

# Bundle both tables into the project's data object and show its sample count
data = Data(d_snps=data_snps, d_phens=data_phens)
print(data.n_samples)

Germ            0
GBegF           0
BegFEndF        0
EndFBegM        0
BegMEndM        0
FloCol          0
StemCol         0
BushShape       0
LeafSize        0
FlowStemCol     0
AscoRes         0
StemBr          0
StemL1ord       0
StemBr1ord      0
StemBr2ord      0
PodD            0
PodS            0
Height          0
Hlp             0
NoPodsWeight    0
PodsWeight      0
PodsNumber      0
SeedsNumber     0
SeedsWeight     0
PodShape        0
PodLength       0
PodWidth        0
SeedShape       0
SeedCol         0
Seed1000W       0
dtype: int64
404


## Create model

In [4]:
# Build the model object from the prepared data container. Only `data` is
# passed here; the recorded output of this cell reads
# "SEM model was not defined".
model = mtmlModel(data=data)

SEM model was not defined


In [7]:
# Presumably derives the latent-factor structure from the phenotypes
# (TODO confirm against mtmlModel.get_lat_struct), then prints the model.
# The recorded output reports the structure type ("unconnect") and one
# `=~` measurement line per factor, F0 through F4.
model.get_lat_struct()
model.show_mod()

Type of the latent structure is unconnect
# Model mod0
F0 =~ PodsWeight + PodsNumber + SeedsNumber + SeedsWeight
# Model mod1
F1 =~ NoPodsWeight + PodShape + PodLength + PodWidth + Seed1000W
# Model mod2
F2 =~ FloCol + StemCol + SeedShape + SeedCol
# Model mod3
F3 =~ BegFEndF + EndFBegM
# Model mod4
F4 =~ Height + Hlp


## Add SNPs

In [8]:
# Add SNPs to the model. `snp_pref` ('Ca') is presumably the SNP-name prefix;
# the SNP names in the recorded output (e.g. Ca7_32482435) start with it.
# NOTE(review): `model` is rebound to the return value, so re-running this
# cell calls add_snps() on the previous result rather than on the model from
# the "Create model" section; re-run that section first.
# NOTE(review): this call prints a very long log; consider silencing or
# capturing it before sharing the notebook.
model = model.add_snps(snp_pref=snp_pref)

F0
PodsNumber
SeedsWeight
PodsWeight
SeedsNumber
F0 =~ 1.0 * PodsWeight
F0 =~ 0.9997553747355805 * PodsNumber
F0 =~ 0.9071818056783406 * SeedsNumber
F0 =~ 1.0759638553617537 * SeedsWeight
F0
F0 =~ 1.0 * PodsWeight
F0 =~ 0.9997553747355805 * PodsNumber
F0 =~ 0.9071818056783406 * SeedsNumber
F0 =~ 1.0759638553617537 * SeedsWeight
-----------
16.829923656290944 16.829923656290944
Skip 0 SNPs
0.7189625998202747
16.829923656290944
0.7178690211083589
8.306973317872174
13.469395010682476 13.469395010682476
Skip 423 SNPs
0.7423524955828835
13.469395010682476
0.7180327645599238
4.324537680509
11.606186203742588 11.606186203742588
Skip 855 SNPs
0.7573263477964307
11.606186203742588
0.7179516697183779
2.6163558255534625
10.700739607585295 10.700739607585295
Skip 1006 SNPs
0.7660398966927211
10.700739607585295
0.7178979415213913
1.785389679413349
10.071292874504355 10.071292874504355
Skip 1046 SNPs
0.868058063920019
10.071292874504355
0.7182471031545754
1.4029834003126744
9.436412182502607 9.43641



0.03759819244963225
3.142862359918542
0.0020946195744051543
0.44977110943860676
3.063996332633419 3.063996332633419
Skip 1516 SNPs
0.03962637976141181
3.063996332633419
0.002146871785424276
0.447272708450984
F3 =~ 1.0 * BegFEndF
F3 =~ -0.8258969791854806 * EndFBegM
F3 ~ 0.6087237997763335*Ca7_32482435
F3 ~ -0.49489714656397876*Ca7_36747540
F3 ~ 0.41595465967365775*Ca3_19353482
F3 ~ -0.37868104870249386*Ca3_9387546
F3 ~ 0.3382923031488677*Ca6_53592514
F3 ~ 0.33260993629367647*Ca3_28437425
F3 ~ -0.26303926302872976*Ca2_27434688
F3 ~ 0.2769515036653856*Ca1_5480709
F3 ~ 0.2521410734598684*Ca6_15283408
F3 ~ -0.2586705782226478*Ca2_35983700
-----------
-----------
F4
Height
Hlp
F4 =~ 1.0 * Height
F4 =~ 0.596711045528099 * Hlp
F4
F4 =~ 1.0 * Height
F4 =~ 0.596711045528099 * Hlp
-----------
16.821502530226052 16.821502530226056
Skip 0 SNPs
0.00021912807151980296
16.821502530226056
4.7155992312308825e-05
8.378456180666763
9.850589977601322 9.850589977601322
Skip 142 SNPs
0.0015938292489048322
9