# 🔍 EcoAlert: NLP for Climate Emergency Tweets

This notebook applies NLP to classify tweets as emergency-related or not. Tweets are converted to TF-IDF features and classified with a linear SVM.

In [None]:
# Import libraries
import pandas as pd
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.model_selection import train_test_split
from sklearn.svm import LinearSVC
from sklearn.metrics import classification_report

In [None]:
# Read the sample tweets from JSON into a DataFrame, then preview the first rows
df = pd.read_json(path_or_buf='../data/tweets_sample.json')
df.head(n=5)

In [None]:
# Separate the tweet text (features) from the target labels.
# Label encoding: 1 = emergency, 0 = normal
X, y = df['text'], df['label']

In [None]:
# TF-IDF vectorization
vectorizer = TfidfVectorizer(stop_words='english')
X_vec = vectorizer.fit_transform(X)

In [None]:
# Train-test split
X_train, X_test, y_train, y_test = train_test_split(X_vec, y, test_size=0.2, random_state=42)

In [None]:
# Train SVM classifier
# random_state is fixed because the solver behind LinearSVC shuffles the data
# in its dual formulation; without a seed the fitted weights (and therefore the
# evaluation metrics) can differ from one run to the next.
clf = LinearSVC(random_state=42)
clf.fit(X_train, y_train)

In [None]:
# Score the classifier on the held-out split and print per-class
# precision / recall / F1
y_pred = clf.predict(X_test)
print(classification_report(y_true=y_test, y_pred=y_pred))