<a href="https://colab.research.google.com/github/hajibeevi/genai/blob/main/bioreactor_eff_prediction_project.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [1]:
# Install necessary packages
!pip install -q scikit-learn pandas

# Import libraries
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LogisticRegression
from sklearn.metrics import accuracy_score

# Simulated dataset for bioreactor efficiency: ten hand-entered rows, one value
# per row in each list. The lists must stay the same length.
data = {
    'temperature': [30, 35, 37, 25, 40, 32, 28, 33, 34, 36],
    'ph': [7.0, 6.8, 7.2, 7.5, 6.5, 7.0, 7.3, 6.9, 7.1, 6.8],
    'oxygen_concentration': [5.0, 4.8, 5.2, 5.5, 4.6, 5.1, 4.9, 5.0, 5.3, 4.7],
    'substrate_concentration': [15, 16, 14, 13, 15, 16, 14, 13, 15, 16],
    'efficiency': [1, 0, 1, 0, 1, 1, 0, 1, 1, 0]  # 1 = High Efficiency, 0 = Low Efficiency
}

# Tunable settings, declared once so training and inference cannot drift apart.
FEATURE_COLUMNS = ['temperature', 'ph', 'oxygen_concentration', 'substrate_concentration']
TARGET_COLUMN = 'efficiency'
TEST_SIZE = 0.3     # fraction of rows held out for evaluation
RANDOM_STATE = 42   # fixed seed so the train/test split is reproducible

# Create DataFrame
df = pd.DataFrame(data)

# Features and target variable
X = df[FEATURE_COLUMNS]
y = df[TARGET_COLUMN]

# Split dataset into training and testing sets.
# With 10 rows and TEST_SIZE = 0.3 the hold-out set is only 3 rows, so the
# accuracy printed below can only move in steps of one third.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=TEST_SIZE, random_state=RANDOM_STATE
)
assert len(X_train) + len(X_test) == len(df), "train/test split lost or duplicated rows"

# Train a Logistic Regression model (library defaults).
# NOTE(review): the features are fed in unscaled - consider standardising them
# if the solver reports convergence problems; confirm before changing results.
model = LogisticRegression()
model.fit(X_train, y_train)

# Make predictions on the test set
y_pred = model.predict(X_test)

# Evaluate the model's accuracy
accuracy = accuracy_score(y_test, y_pred)
print(f"Model Accuracy: {accuracy:.2f}")

# Predict efficiency for new conditions.
# Values are listed in FEATURE_COLUMNS order. They are wrapped in a DataFrame
# carrying the training column names because the model was fitted on a named
# DataFrame; passing the bare list makes scikit-learn warn that X has no valid
# feature names and leaves the column order unchecked.
new_conditions = [[32, 7.0, 5.0, 15]]  # New bioreactor conditions
new_conditions_df = pd.DataFrame(new_conditions, columns=FEATURE_COLUMNS)
prediction = model.predict(new_conditions_df)
print(f"Predicted Efficiency: {'High' if prediction[0] == 1 else 'Low'}")


Model Accuracy: 0.33
Predicted Efficiency: Low


