In [6]:
import os

import numpy as np
import pandas as pd
from sklearn.ensemble import GradientBoostingRegressor
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.metrics import mean_squared_error
from sklearn.model_selection import train_test_split
from sklearn.pipeline import Pipeline


In [3]:
# Location of the IELTS writing dataset CSV.
# The default is the original author's local path; set the IELTS_DATASET_PATH
# environment variable to run the notebook on another machine without
# editing this cell.
file_path = os.environ.get(
    "IELTS_DATASET_PATH",
    "C:/Users/Arkats/Downloads/ielts_writing_dataset.csv/ielts_writing_dataset.csv",
)

# Read the raw CSV into a DataFrame; later cells clean it and pull the
# 'Essay' and 'Overall' columns out of it.
data = pd.read_csv(file_path)

In [7]:
# Only the essay text and its overall score are used for modelling, so any
# row that is missing either of them is discarded here.
required_columns = ['Essay', 'Overall']
data = data.dropna(axis='index', how='any', subset=required_columns)

In [8]:
# Convert the 'Overall' column to numbers; entries that cannot be parsed become
# NaN (errors='coerce') and the rows holding them are then dropped.
#
# The conversion is done with .assign() so that a new frame is produced rather
# than writing a column into the existing one: direct column assignment on a
# frame that came out of a row filter can emit SettingWithCopyWarning on
# pandas versions that predate copy-on-write.
data = (
    data
    .assign(Overall=pd.to_numeric(data['Overall'], errors='coerce'))
    .dropna(subset=['Overall'])
)

In [9]:
# Features are the essay texts; the regression target is the overall score.
X, y = data['Essay'], data['Overall']

In [10]:
# Hold out 20% of the essays for evaluation; the fixed seed keeps the split
# the same from run to run.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=42,
)

In [11]:
# Step 1: turn each essay into a TF-IDF vector limited to 5000 features.
tfidf_step = ('tfidf', TfidfVectorizer(max_features=5000))

# Step 2: gradient-boosted regressor, seeded for repeatable fits.
model_step = ('model', GradientBoostingRegressor(random_state=42))

# Chain both steps so raw text goes in and a predicted score comes out.
pipeline = Pipeline(steps=[tfidf_step, model_step])


In [12]:
# Fit the vectorizer and the regressor on the training split. The call is left
# as the cell's last expression so the notebook shows the fitted pipeline.
pipeline.fit(X=X_train, y=y_train)

In [13]:
# Predict overall scores for the held-out essays.
y_pred = pipeline.predict(X=X_test)

In [14]:
# Compare the held-out targets with the predictions and report the mean
# squared error.
mse = mean_squared_error(y_true=y_test, y_pred=y_pred)
print(f"Mean Squared Error: {mse}")

Mean Squared Error: 0.8427866167880784


In [20]:
# Unseen essays to score with the fitted pipeline. Each list element is one
# complete essay as a single string; add more strings to score several essays
# in one call. The text is passed to the model exactly as written, including
# the leading indentation of the continuation lines inside the literal.
new_essays = [
    """Climate change has become a significant topic of debate in recent years, with some considering it the most critical environmental challenge of our time. However, others argue that other ecological issues, such as deforestation and water scarcity, pose equally severe threats. This essay will discuss both perspectives before presenting my view that climate change is indeed the most pressing concern due to its far-reaching and multifaceted impact.
    On the one hand, proponents of the view that climate change is the primary environmental issue emphasize its global implications. Rising temperatures lead to more frequent and severe weather events, including hurricanes, droughts, and floods, which disrupt ecosystems and human societies alike. Furthermore, the melting of polar ice caps contributes to rising sea levels, threatening coastal communities and biodiversity. Such wide-ranging consequences indicate that climate change affects not only the environment but also the global economy, food security, and human health.
    On the other hand, some argue that other environmental problems demand equal attention. For instance, deforestation not only accelerates climate change by reducing the number of carbon-absorbing trees but also endangers countless species, leading to a loss of biodiversity. Similarly, water scarcity affects millions of people worldwide, particularly in developing countries, where access to clean water remains a persistent challenge. These issues are more immediate for certain populations and, therefore, may appear more urgent to address.
    Despite the validity of these concerns, I believe that climate change overshadows other environmental issues due to its interconnected nature. Climate change exacerbates problems like deforestation, as changing weather patterns can make forests more vulnerable to wildfires. Similarly, it worsens water scarcity through prolonged droughts in arid regions. By addressing climate change, many of these related issues can also be mitigated, making it the most logical starting point for global environmental action.
    In conclusion, while problems such as deforestation and water scarcity are undeniably critical, climate change remains the most significant environmental challenge due to its comprehensive impact and the way it amplifies other issues. International cooperation and immediate action are essential to mitigate its effects and ensure a sustainable future for humanity."""
]
# Score the new essays with the fitted pipeline; the result holds one
# predicted overall score per essay, in the same order as the input list.
predictions = pipeline.predict(X=new_essays)
print("Predicted Overall Scores:", predictions)

Predicted Overall Scores: [6.82086195]


In [18]:
# Show the current contents of `data` as the cell's rich output. pandas elides
# the middle rows of a long frame, so only the first and last few rows appear.
# NOTE(review): consider data.head() / data.sample(5) for a shorter preview.
data

Unnamed: 0,Task_Type,Question,Essay,Examiner_Commen,Task_Response,Coherence_Cohesion,Lexical_Resource,Range_Accuracy,Overall
0,1,The bar chart below describes some changes abo...,"Between 1995 and 2010, a study was conducted r...",,,,,,5.5
1,2,Rich countries often give money to poorer coun...,Poverty represents a worldwide crisis. It is t...,,,,,,6.5
2,1,The bar chart below describes some changes abo...,The left chart shows the population change hap...,,,,,,5.0
3,2,Rich countries often give money to poorer coun...,Human beings are facing many challenges nowada...,,,,,,5.5
4,1,The graph below shows the number of overseas v...,Information about the thousands of visits from...,,,,,,7.0
...,...,...,...,...,...,...,...,...,...
1430,2,Without capital punishment our lives are less ...,Serious crimes need capital punishment so that...,"You should rewrite it, giving more thought to ...",,,,,5.0
1431,2,Some people think that they can learn better b...,It is certainly said that learning is an ongoi...,Where are the paragraphs in this essay? You mu...,,,,,5.0
1432,2,Nowadays people like to change their day by da...,popular hobbies rather than their individual a...,I suggest that you read several essays that ha...,,,,,5.0
1433,2,Universities should allocate the same amount o...,"Yes, I do feel that universities should have a...","Your essay too short, the introduction is good...",,,,,5.0
