**Install Pycaret**

In [1]:
!pip install pycaret

Collecting pycaret
  Downloading pycaret-3.1.0-py3-none-any.whl (483 kB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m483.9/483.9 kB[0m [31m3.8 MB/s[0m eta [36m0:00:00[0m
Collecting pyod>=1.0.8 (from pycaret)
  Downloading pyod-1.1.0.tar.gz (153 kB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m153.4/153.4 kB[0m [31m6.6 MB/s[0m eta [36m0:00:00[0m
[?25h  Preparing metadata (setup.py) ... [?25l[?25hdone
Collecting category-encoders>=2.4.0 (from pycaret)
  Downloading category_encoders-2.6.2-py2.py3-none-any.whl (81 kB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m81.8/81.8 kB[0m [31m8.3 MB/s[0m eta [36m0:00:00[0m
Collecting deprecation>=2.1.0 (from pycaret)
  Downloading deprecation-2.1.0-py2.py3-none-any.whl (11 kB)
Collecting xxhash (from pycaret)
  Downloading xxhash-3.3.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (194 kB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m194.1/194.1 

In [2]:
from google.colab import drive
drive.mount('/content/gdrive')

Mounted at /content/gdrive


In [4]:
import pandas as pd
air_quality = pd.read_csv("/content/gdrive/MyDrive/Datasets/AirQualityUCI.csv")

In [5]:
air_quality.shape

(9357, 15)

In [6]:
air_quality = air_quality.head(500)

**Import Library**

In [7]:
from pycaret.anomaly import *

**Setup**

In [8]:
anomaly_setup = setup(air_quality,session_id = 123)

Unnamed: 0,Description,Value
0,Session id,123
1,Original data shape,"(500, 15)"
2,Transformed data shape,"(500, 59)"
3,Numeric features,13
4,Categorical features,2
5,Preprocess,True
6,Imputation type,simple
7,Numeric imputation,mean
8,Categorical imputation,mode
9,Maximum one-hot encoding,-1


In [9]:
models()

Unnamed: 0_level_0,Name,Reference
ID,Unnamed: 1_level_1,Unnamed: 2_level_1
abod,Angle-base Outlier Detection,pyod.models.abod.ABOD
cluster,Clustering-Based Local Outlier,pycaret.internal.patches.pyod.CBLOFForceToDouble
cof,Connectivity-Based Local Outlier,pyod.models.cof.COF
iforest,Isolation Forest,pyod.models.iforest.IForest
histogram,Histogram-based Outlier Detection,pyod.models.hbos.HBOS
knn,K-Nearest Neighbors Detector,pyod.models.knn.KNN
lof,Local Outlier Factor,pyod.models.lof.LOF
svm,One-class SVM detector,pyod.models.ocsvm.OCSVM
pca,Principal Component Analysis,pyod.models.pca.PCA
mcd,Minimum Covariance Determinant,pyod.models.mcd.MCD


**Create Model**

In [10]:
iforest = create_model("iforest")
print(iforest)

Processing:   0%|          | 0/3 [00:00<?, ?it/s]

IForest(behaviour='new', bootstrap=False, contamination=0.05,
    max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=-1,
    random_state=123, verbose=0)


In [11]:
anomaly_model = assign_model(iforest)

**Evaluate Model**

In [14]:
evaluate_model(iforest)

interactive(children=(ToggleButtons(description='Plot Type:', icons=('',), options=(('Pipeline Plot', 'pipelin…

**Predictions**

In [16]:
predictions = predict_model(iforest, data=air_quality)

In [17]:
predictions

Unnamed: 0,Date_3/10/2004,Date_3/11/2004,Date_3/12/2004,Date_3/13/2004,Date_3/14/2004,Date_3/15/2004,Date_3/16/2004,Date_3/17/2004,Date_3/18/2004,Date_3/19/2004,...,NOx(GT),PT08.S3(NOx),NO2(GT),PT08.S4(NO2),PT08.S5(O3),T,RH,AH,Anomaly,Anomaly_Score
0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,166.0,1056.0,113.0,1692.0,1268.0,13.6,48.9,0.7578,0,-0.070164
1,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,103.0,1174.0,92.0,1559.0,972.0,13.3,47.7,0.7255,0,-0.064270
2,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,131.0,1140.0,114.0,1555.0,1074.0,11.9,54.0,0.7502,0,-0.060989
3,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,172.0,1092.0,122.0,1584.0,1203.0,11.0,60.0,0.7867,0,-0.074403
4,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,131.0,1205.0,116.0,1490.0,1110.0,11.2,59.6,0.7888,0,-0.051177
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
495,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,181.0,872.0,125.0,1576.0,1093.0,10.4,74.4,0.9384,0,-0.052305
496,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,144.0,957.0,118.0,1498.0,965.0,11.5,71.0,0.9582,0,-0.050653
497,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,140.0,902.0,109.0,1579.0,1004.0,12.2,70.0,0.9924,0,-0.049394
498,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,204.0,779.0,123.0,1772.0,1166.0,12.3,73.3,1.0442,0,-0.044365
