In [None]:
import pandas as pd
import numpy as np
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.preprocessing import LabelEncoder
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import accuracy_score

In [None]:
# Load the data into a pandas DataFrame and drop every row that has a
# missing value in any column.
df = pd.read_csv("Anime_data.csv").dropna()

# One seed shared by the train/test split and the forest, so that a
# Restart & Run All reproduces the same accuracy.
SEED = 42

# Encode the categorical data as integer codes.
# The same LabelEncoder is refit for each column, so after the loop `le`
# only holds the mapping of the last column ("Studio").
# NOTE(review): the encoder is fit on the full frame before the split below.
le = LabelEncoder()
for column in ["Genre", "Type", "Producer", "Studio"]:
    df[column] = le.fit_transform(df[column])

# Convert the text data into numerical representations.
# getnnz() without an axis returns ONE number for the whole TF-IDF matrix,
# which turned "Title" and "Synopsis" into constant columns that carry no
# information. getnnz(axis=1) returns one value per row: the number of
# non-zero TF-IDF entries (i.e. distinct vocabulary terms) in that row's text.
# The result is a plain array, so it is assigned by position and is not
# affected by the gaps dropna() leaves in the index.
# The vectorizer is refit per column; afterwards it holds the "Synopsis" vocabulary.
vectorizer = TfidfVectorizer()
for column in ["Title", "Synopsis"]:
    df[column] = vectorizer.fit_transform(df[column]).getnnz(axis=1)

# Bin the target variable into 5 categorical bins: [0, 2], (2, 4], (4, 6],
# (6, 8], (8, 10] -> labels 1..5. pd.cut already returns categorical data,
# so no extra astype('category') is needed.
df["Rating"] = pd.cut(
    df["Rating"],
    bins=[0, 2, 4, 6, 8, 10],
    labels=[1, 2, 3, 4, 5],
    include_lowest=True,
)

# Split the data into training and testing sets (80% / 20%)
X = df[["Title", "Genre", "Synopsis", "Type", "Producer", "Studio"]]
y = df["Rating"]
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=SEED
)

# Train the random forest classifier on the training set.
# random_state pins the bootstrap sampling and feature selection so the
# reported accuracy is the same on every run.
model = RandomForestClassifier(random_state=SEED)
model.fit(X_train, y_train)

# Evaluate the model on the testing set
y_pred = model.predict(X_test)
accuracy = accuracy_score(y_test, y_pred)
print("Accuracy:", accuracy)


Accuracy: 0.7979910714285714


In [None]:
# Show the first five rows of df (five is head's default row count)
df.head(n=5)

Unnamed: 0,Anime_id,Title,Genre,Synopsis,Type,Producer,Studio,Rating,ScoredBy,Popularity,Members,Episodes,Source,Aired,Link
0,1,17376,12,299581,5,467,476,5,363889.0,39.0,704490.0,26.0,Original,"Apr 3, 1998 to Apr 24, 1999",https://myanimelist.net/anime/1/Cowboy_Bebop
1,5,17376,918,299581,0,1784,91,5,111187.0,475.0,179899.0,1.0,Original,"Sep 1, 2001",https://myanimelist.net/anime/5/Cowboy_Bebop__...
2,6,17376,780,299581,5,2219,277,5,197451.0,158.0,372709.0,26.0,Manga,"Apr 1, 1998 to Sep 30, 1998",https://myanimelist.net/anime/6/Trigun
3,7,17376,617,299581,5,467,476,4,31875.0,1278.0,74889.0,26.0,Original,"Jul 2, 2002 to Dec 24, 2002",https://myanimelist.net/anime/7/Witch_Hunter_R...
5,15,17376,927,299581,5,1985,437,5,48765.0,888.0,106468.0,145.0,Manga,"Apr 6, 2005 to Mar 19, 2008",https://myanimelist.net/anime/15/Eyeshield_21
