# Network Intrusion Detection System using Machine Learning
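This notebook demonstrates how to build a network intrusion detection system (NIDS) by training a Random Forest classifier on a labelled network-traffic dataset from Kaggle, and then evaluating it with accuracy, a per-class classification report, and a confusion matrix.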

In [None]:
# Install the required packages first if they are missing (e.g. when running in a cloud environment such as IBM Watson Studio)
# %pip install pandas numpy scikit-learn matplotlib seaborn

import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import classification_report, confusion_matrix, accuracy_score


In [None]:
# Read the CSV into a DataFrame and preview it. The path is relative, so the
# file is looked up in the kernel's current working directory.
# NOTE(review): the preprocessing cell expects a 'class' target column, while
# the filename suggests a test split -- confirm this file actually carries labels.
df = pd.read_csv(filepath_or_buffer="Test_data.csv")
df.head(n=5)


In [None]:
# Encode labels and preprocess data
from sklearn.preprocessing import LabelEncoder

TARGET_COL = 'class'  # assuming 'class' is the target column

# Fail early with a readable message when the loaded file has no labels;
# the bare column lookup would otherwise raise an unexplained KeyError.
if TARGET_COL not in df.columns:
    raise KeyError(
        f"Target column {TARGET_COL!r} not found in the loaded data; "
        f"available columns: {list(df.columns)}"
    )

# Replace every missing value with 0. Rebinding (instead of inplace=True)
# keeps the step chainable and avoids mutating the object in place.
df = df.fillna(0)

# Map the class values to integer codes; `le.classes_` keeps the original
# names so the codes can be translated back later.
le = LabelEncoder()
df['label'] = le.fit_transform(df[TARGET_COL])

# Features: every column except the raw target and its encoded copy.
X = df.drop(columns=[TARGET_COL, 'label'])
# One-hot encode string/categorical feature columns: the random forest fitted
# later needs numeric input and would fail on raw strings. For a frame that is
# already fully numeric this leaves the columns unchanged.
X = pd.get_dummies(X)
y = df['label']  # Encoded target

# Hold out 30% of the rows for evaluation; the fixed seed makes the split repeatable.
# NOTE(review): consider stratify=y if every class has at least two samples.
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.3, random_state=42)

# Sanity check: the split must account for every row exactly once.
assert len(X_train) + len(X_test) == len(X), "train/test split lost or duplicated rows"


In [None]:
# Fit a random forest of 100 trees on the training split (the fixed seed makes
# the fit repeatable), then predict labels for the held-out test split.
model = RandomForestClassifier(random_state=42, n_estimators=100).fit(X_train, y_train)
y_pred = model.predict(X_test)


In [None]:
# Evaluate the model
print("Accuracy:", accuracy_score(y_test, y_pred))

# Show per-class metrics under the original class names rather than the
# integer codes produced by the LabelEncoder. `labels` is passed explicitly so
# names and codes stay aligned even if a class is missing from the test split;
# zero_division=0 reports 0 (without a warning) for such classes.
class_names = [str(name) for name in le.classes_]
report = classification_report(
    y_test,
    y_pred,
    labels=list(range(len(class_names))),
    target_names=class_names,
    zero_division=0,
)
print("\nClassification Report:\n", report)


In [None]:
# Plot confusion matrix
# Fix the label order to the encoder's codes (0..n_classes-1) so that row and
# column i always correspond to le.classes_[i], even if a class is absent from
# the test split.
cm = confusion_matrix(y_test, y_pred, labels=list(range(len(le.classes_))))
class_names = [str(name) for name in le.classes_]

# Explicit figure/axes interface; tick labels carry the original class names
# so the figure can be read without the encoder mapping.
fig, ax = plt.subplots(figsize=(10, 6))
sns.heatmap(
    cm,
    annot=True,
    fmt='d',
    cmap='Blues',
    xticklabels=class_names,
    yticklabels=class_names,
    ax=ax,
)
ax.set_title('Confusion Matrix')
ax.set_xlabel('Predicted')
ax.set_ylabel('Actual')
plt.show()
