In [None]:
# Import necessary libraries
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.svm import SVC
from sklearn.preprocessing import StandardScaler
from sklearn.metrics import classification_report, confusion_matrix

# Assuming you have a dataset where 'X' contains the features and 'y' contains the labels (0 for legitimate, 1 for fraudulent)
# Replace this with your actual dataset loading code
# Example:
# df = pd.read_csv('your_dataset.csv')
# X = df.drop('label_column', axis=1)  # Features
# y = df['label_column']  # Labels

# Build a small in-memory demo dataset (eight transactions) so that this cell
# does not depend on any external file.
data = {}
data['amount'] = [10.00, 20.00, 30.00, 40.00, 50.00, 60.00, 70.00, 80.00]
data['location'] = ['US', 'CA', 'US', 'US', 'CA', 'US', 'CA', 'US']
data['time_of_day'] = ['morning', 'afternoon', 'evening', 'morning',
                       'afternoon', 'evening', 'morning', 'afternoon']
data['label'] = [0, 1, 0, 0, 1, 0, 1, 0]  # 0 - legitimate, 1 - fraudulent
df = pd.DataFrame(data)

# Target vector first, then the feature frame without the target column.
y = df['label']
X = df.drop(columns=['label'])

# One-hot encode the two categorical features; 'amount' is left untouched.
X = pd.get_dummies(X, columns=['location', 'time_of_day'])

# Hold out 20% of the rows for evaluation; the fixed seed makes the split repeatable.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=0
)

# Standardise the features. The scaler statistics are learned from the training
# rows only and then reused unchanged on the test rows.
sc = StandardScaler().fit(X_train)
X_train = sc.transform(X_train)
X_test = sc.transform(X_test)

# Linear-kernel support vector classifier; fit() returns the fitted estimator.
classifier = SVC(kernel='linear', random_state=0).fit(X_train, y_train)

# Predict labels for the held-out rows.
y_pred = classifier.predict(X_test)

# Report: each heading is followed on the next line by the corresponding metric.
print("Confusion Matrix:", confusion_matrix(y_test, y_pred), sep="\n")
print("\nClassification Report:", classification_report(y_test, y_pred), sep="\n")


Confusion Matrix:
[[1 0]
 [0 1]]

Classification Report:
              precision    recall  f1-score   support

           0       1.00      1.00      1.00         1
           1       1.00      1.00      1.00         1

    accuracy                           1.00         2
   macro avg       1.00      1.00      1.00         2
weighted avg       1.00      1.00      1.00         2



In [2]:
# Import necessary libraries
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import classification_report, confusion_matrix, accuracy_score

# Assuming you have a dataset where 'X' contains the features and 'y' contains the labels (0 for legitimate, 1 for fraudulent)
# Replace the sample-data section below with your actual dataset loading code.
# The CSV read is intentionally left commented out: the frame it produces would be
# overwritten by the sample data below, and the absolute '/content/...' path makes
# the cell fail on any machine where that file is missing.
# Example:
# df = pd.read_csv('/content/sample_data/onlinefraud.csv')
# X = df.drop('label_column', axis=1)  # Features
# y = df['label_column']  # Labels

# Generate some sample data for demonstration (eight transactions, three features)
data = {
    'amount': [10.00, 20.00, 30.00, 40.00, 50.00, 60.00, 70.00, 80.00],
    'location': ['US', 'CA', 'US', 'US', 'CA', 'US', 'CA', 'US'],
    'time_of_day': ['morning', 'afternoon', 'evening', 'morning', 'afternoon', 'evening', 'morning', 'afternoon'],
    'label': [0, 1, 0, 0, 1, 0, 1, 0]  # 0 - legitimate, 1 - fraudulent
}
df = pd.DataFrame(data)

# Split the frame into the feature columns (X) and the target column (y)
X = df.drop('label', axis=1)
y = df['label']

# Convert categorical variables into dummy/indicator variables;
# the numeric 'amount' column is passed through unchanged
X = pd.get_dummies(X, columns=['location', 'time_of_day'])

# Hold out 20% of the rows for evaluation; the fixed seed makes the split repeatable.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=0,
)

# Random forest with 100 trees, seeded so repeated runs build the same forest.
classifier = RandomForestClassifier(n_estimators=100, random_state=0)
classifier.fit(X_train, y_train)

# Predict labels for the held-out rows.
y_pred = classifier.predict(X_test)

# Print each heading followed by its metric, in the same order as before,
# then the overall accuracy on a single line.
for heading, metric in (
    ("Confusion Matrix:", confusion_matrix),
    ("\nClassification Report:", classification_report),
):
    print(heading)
    print(metric(y_test, y_pred))
print("\nAccuracy Score:", accuracy_score(y_test, y_pred))


Confusion Matrix:
[[1 0]
 [0 1]]

Classification Report:
              precision    recall  f1-score   support

           0       1.00      1.00      1.00         1
           1       1.00      1.00      1.00         1

    accuracy                           1.00         2
   macro avg       1.00      1.00      1.00         2
weighted avg       1.00      1.00      1.00         2


Accuracy Score: 1.0


In [1]:
# Import necessary libraries
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LogisticRegression
from sklearn.preprocessing import StandardScaler
from sklearn.metrics import classification_report, confusion_matrix

# Assuming you have a dataset where 'X' contains the features and 'y' contains the labels (0 for legitimate, 1 for fraudulent)
# Replace the sample-data section below with your actual dataset loading code.
# The CSV read stays commented out because its result would be discarded as soon
# as the sample frame is built, while the absolute '/content/...' path would still
# make the cell raise wherever that file does not exist.
# Example:
# df = pd.read_csv('/content/sample_data/onlinefraud.csv')
# X = df.drop('label_column', axis=1)  # Features
# y = df['label_column']  # Labels

# Generate some sample data for demonstration (eight transactions, three features)
data = {
    'amount': [10.00, 20.00, 30.00, 40.00, 50.00, 60.00, 70.00, 80.00],
    'location': ['US', 'CA', 'US', 'US', 'CA', 'US', 'CA', 'US'],
    'time_of_day': ['morning', 'afternoon', 'evening', 'morning', 'afternoon', 'evening', 'morning', 'afternoon'],
    'label': [0, 1, 0, 0, 1, 0, 1, 0]  # 0 - legitimate, 1 - fraudulent
}
df = pd.DataFrame(data)

# Features are every column except the target; the target is the 'label' column
X = df.drop('label', axis=1)
y = df['label']

# Convert categorical variables into dummy/indicator variables;
# the numeric 'amount' column is passed through unchanged
X = pd.get_dummies(X, columns=['location', 'time_of_day'])

# Split data into training and testing sets (20% held out, fixed seed for repeatability).
# Note: the split is not stratified, so the class balance of the test rows depends on the seed.
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=0)

# Feature scaling for Logistic Regression: the scaler is fitted on the training
# rows only and the same transformation is then applied to the test rows
sc = StandardScaler()
X_train = sc.fit_transform(X_train)
X_test = sc.transform(X_test)

# Initialize Logistic Regression classifier (seeded for reproducibility)
classifier = LogisticRegression(random_state=0)

# Train the classifier
classifier.fit(X_train, y_train)

# Predictions on the test set
y_pred = classifier.predict(X_test)

# Evaluating the model
print("Confusion Matrix:")
print(confusion_matrix(y_test, y_pred))
print("\nClassification Report:")
# zero_division=0: when a class receives no predictions its precision is undefined.
# Report it explicitly as 0 (the same value shown by default) instead of letting
# scikit-learn emit an undefined-metric warning for every averaged row.
print(classification_report(y_test, y_pred, zero_division=0))


Confusion Matrix:
[[1 0]
 [1 0]]

Classification Report:
              precision    recall  f1-score   support

           0       0.50      1.00      0.67         1
           1       0.00      0.00      0.00         1

    accuracy                           0.50         2
   macro avg       0.25      0.50      0.33         2
weighted avg       0.25      0.50      0.33         2



  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
