<a href="https://colab.research.google.com/github/Avaniharetlia/MLPROJECTS/blob/main/Pandas.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [None]:
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression
from sklearn.metrics import mean_squared_error
from sklearn.impute import SimpleImputer
from sklearn.preprocessing import StandardScaler

# Fit a simple linear regression that predicts salary from years of
# experience, report its test-set error, and predict one new example.

# Load the dataset
data = pd.read_csv('/content/Salary_Data.csv')

# Inspect the data
print("First 5 rows:\n", data.head())

# Check column names
print("\nColumn Names:", data.columns.tolist())

# Column names as they appear in the CSV header
feature_columns = ['Years of Experience']
target_column = 'Salary'

# Rows without a target cannot be used for supervised training or scoring.
# Drop them rather than imputing the label, which would invent salaries and
# bias both the fitted model and the reported error.
labelled = data.dropna(subset=[target_column])
X = labelled[feature_columns]  # Features
y = labelled[target_column]    # Target

# Split BEFORE fitting any preprocessing so that statistics from the test
# rows (mean used for imputation, mean/std used for scaling) never leak
# into the training pipeline.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=42
)

# Handle missing feature values and standardize, fitting on the training
# fold only and re-using the fitted transformers for the test fold.
imputer_X = SimpleImputer(strategy='mean')
scaler = StandardScaler()
X_train = scaler.fit_transform(imputer_X.fit_transform(X_train))
X_test = scaler.transform(imputer_X.transform(X_test))

# Create and train the model
model = LinearRegression()
model.fit(X_train, y_train)

# Predict on test data
y_pred = model.predict(X_test)

# Evaluate the model
mse = mean_squared_error(y_test, y_pred)
print(f"\nMean Squared Error: {mse:.2f}")

# Predict salary for 5 years of experience.
# New data goes through the same fitted imputer and scaler as the training
# data; the imputer was fitted on a DataFrame with this column name, so the
# feature names line up and no feature-name warning is raised.
new_data = pd.DataFrame({'Years of Experience': [5]})
new_data_scaled = scaler.transform(imputer_X.transform(new_data))
predicted_salary = model.predict(new_data_scaled)

print(f"\nPredicted Salary for 5 Years Experience: ${predicted_salary[0]:.2f}")

First 5 rows:
     Age  Gender Education Level          Job Title  Years of Experience  \
0  32.0    Male      Bachelor's  Software Engineer                  5.0   
1  28.0  Female        Master's       Data Analyst                  3.0   
2  45.0    Male             PhD     Senior Manager                 15.0   
3  36.0  Female      Bachelor's    Sales Associate                  7.0   
4  52.0    Male        Master's           Director                 20.0   

     Salary  
0   90000.0  
1   65000.0  
2  150000.0  
3   60000.0  
4  200000.0  

Column Names: ['Age', 'Gender', 'Education Level', 'Job Title', 'Years of Experience', 'Salary']

Mean Squared Error: 927079077.87

Predicted Salary for 5 Years Experience: $93665.78


