Dataset appended to javascript_snippets.csv


In [20]:
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.feature_extraction.text import CountVectorizer
from sklearn.pipeline import Pipeline
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import accuracy_score

# Load the keyword -> snippet dataset.
data = pd.read_csv("javascript_snippets.csv")

# read_csv parses blank cells as NaN, and CountVectorizer raises on NaN
# documents, so keep only rows where both columns are populated. When the CSV
# has no blanks this is a no-op and the split below is unchanged.
labelled = data.dropna(subset=["keyword", "code"])

# Split data into input (X) and output (y): the keyword text is the feature,
# the full code snippet string is the class label.
X = labelled["keyword"]
y = labelled["code"]

# Hold out 20% of the rows for evaluation; the fixed seed keeps the split reproducible.
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Pipeline: bag-of-words counts over the keyword text, then a random forest classifier.
pipeline = Pipeline([
    ("vectorizer", CountVectorizer()),
    ("model", RandomForestClassifier(random_state=42))
])

# Train the model on the training split only.
pipeline.fit(X_train, y_train)

# Evaluate the model with exact-match accuracy on both splits.
# NOTE(review): a classifier can only emit labels it saw during fit, so any
# snippet that occurs only in the test split can never be predicted correctly.
# If most snippets are unique, test accuracy will sit near zero regardless of
# model quality -- confirm whether a held-out accuracy is meaningful here.
train_accuracy = accuracy_score(y_train, pipeline.predict(X_train))
test_accuracy = accuracy_score(y_test, pipeline.predict(X_test))
print("Training accuracy:", train_accuracy)
print("Testing accuracy:", test_accuracy)

# Example inference: predict expects an iterable of documents, hence the list.
keyword_input = "fetch  "
predicted_code = pipeline.predict([keyword_input])
print("Predicted code:", predicted_code[0])


Training accuracy: 1.0
Testing accuracy: 0.0
Predicted code: fetch('https://api.example.com/data')
  .then(response => response.json())
  .then(data => console.log(data))
  .catch(error => console.error('Error:', error));


In [14]:
from sklearn.pipeline import Pipeline
from sklearn.feature_extraction.text import CountVectorizer
from sklearn.ensemble import RandomForestClassifier
import joblib

# Persist the fitted pipeline to disk. `pipeline` is not created in this cell:
# the training cell must have been run in the current kernel first, otherwise
# this either fails with NameError or saves an older fit.
joblib.dump(value=pipeline, filename='model.pkl')


['model.pkl']