In [1]:
# Import pandas
import pandas as pd
# Import the required dependencies from sklearn
from sklearn.model_selection import train_test_split
from sklearn.pipeline import Pipeline
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.svm import LinearSVC

# Set the column width to view the text message data.
pd.set_option('max_colwidth', 200)

# Import Gradio
import gradio as gr

  from .autonotebook import tqdm as notebook_tqdm


In [2]:
def sms_classification(sms_text_df):
    """
    Perform SMS classification using a pipeline with TF-IDF vectorization and Linear Support Vector Classification.

    Parameters:
    - sms_text_df (pd.DataFrame): DataFrame containing 'text_message' and 'label' columns for SMS classification.

    Returns:
    - text_clf (Pipeline): Fitted pipeline model for SMS classification.

    This function takes a DataFrame with 'text_message' and 'label' columns, splits the data into
    training and testing sets, builds a pipeline with TF-IDF vectorization and Linear Support Vector
    Classification, and fits the model to the training data. 
    The fitted pipeline is returned to make future predictions.
    """
    # Set the features variable to the text message column.
    features = sms_text_df['text_message']

    # Set the target variable to the "label" column.
    target = sms_text_df['label']


    # Split data into training and testing and set the test_size = 33%
    # Set the features variable to the text message. 
    X = sms_text_df['text_message']  
# Set the target variable to the "label" column.
    y = sms_text_df['label']
    X_train, X_test, y_train, y_test = train_test_split(features, target, test_size=0.33, random_state=42)


    # Build a pipeline to transform the test set to compare to the training set.
    text_clf = Pipeline([('tfidf', TfidfVectorizer(stop_words='english')),
                     ('clf', LinearSVC()),
])
    text_clf.fit(X_train, y_train)

    # Fit the model to the transformed training data and return model.
    return text_clf

In [3]:
# Load the dataset into a DataFrame
sms_text_df = pd.read_csv('diamonds.csv')
sms_text_df.head()

Unnamed: 0.1,Unnamed: 0,carat,cut,color,clarity,depth,table,price,x,y,z
0,1,0.23,Ideal,E,SI2,61.5,55.0,326,3.95,3.98,2.43
1,2,0.21,Premium,E,SI1,59.8,61.0,326,3.89,3.84,2.31
2,3,0.23,Good,E,VS1,56.9,65.0,327,4.05,4.07,2.31
3,4,0.29,Premium,I,VS2,62.4,58.0,334,4.2,4.23,2.63
4,5,0.31,Good,J,SI2,63.3,58.0,335,4.34,4.35,2.75


In [4]:
# Call the sms_classification function with the DataFrame and set the result to the "text_clf" variable
text_clf = sms_classification(sms_text_df)

KeyError: 'text_message'

In [None]:
# Create a function called `sms_prediction` that takes in the SMS text and predicts the whether the text is "not spam" or "spam". 
# The function should return the SMS message, and say whether the text is "not spam" or "spam".
def sms_prediction(text):
    """
    Predict the spam/ham classification of a given text message using a pre-trained model.

    Parameters:
    - text (str): The text message to be classified.

    Returns:
    - str: A message indicating whether the text message is classified as spam or not.

    This function takes a text message and a pre-trained pipeline model, then predicts the
    spam/ham classification of the text. The result is a message stating whether the text is
    classified as spam or not.
    """
    # Create a variable that will hold the prediction of a new text.
    prediction = model.predict([text])

    # Using a conditional if the prediction is "ham" return the message:
    # f'The text message: "{text}", is not spam.' Else, return f'The text message: "{text}", is spam.'
    if prediction[0] == 'ham':
        # If the prediction is "ham", return a message stating the text is not spam
        return f'The text message: "{text}", is not spam.'
    else:
        # If the prediction is "spam", return a message stating the text is spam
        return f'The text message: "{text}", is spam.'

In [None]:
import gradio as gr

# Define the sms_app function
def sms_app():
    """
    Create an SMS app using Gradio Interface.

    This function creates an interface with a textbox for inputs and an output for the prediction.
    """
    # Define the function to predict the classification of an SMS text using the pre-trained model.
    def predict_sms(text):
        # Use the sms_prediction function with the pre-trained model (text_clf) and the input text
        return sms_prediction(text, text_clf)

    # Create a Gradio Interface
    iface = gr.Interface(
        fn=predict_sms,  # Function to run on input
        inputs=gr.Textbox(lines=2, label="Enter SMS Text"),  # Input textbox with label
        outputs=gr.Textbox(label="Prediction"),  # Output textbox with label
        title="SMS Spam Detector",  # Title of the app
        description="Enter an SMS text message to predict whether it's spam or not!"
    )

    # Launch the Gradio app
    iface.launch()

# Call the sms_app function to create and launch the app
sms_app()


Running on local URL:  http://127.0.0.1:7860

To create a public link, set `share=True` in `launch()`.


In [None]:
import gradio as gr

# Define some random text messages
text_1 = "You are a lucky winner of $5000!!"
text_2 = "You won 2 free tickets to the Super Bowl."
text_3 = "You won 2 free tickets to the Super Bowl. Text us to claim your prize."
text_4 = "Thanks for registering. Text 4343 to receive free updates on Medicare."

# Test the random text messages using the pre-trained model and print predictions
print(f"Prediction for text_1: {text_clf.predict([text_1])[0]}")
print(f"Prediction for text_2: {text_clf.predict([text_2])[0]}")
print(f"Prediction for text_3: {text_clf.predict([text_3])[0]}")
print(f"Prediction for text_4: {text_clf.predict([text_4])[0]}")

# Define the function that predicts whether an SMS text is spam or not using the pre-trained model
def predict_sms(text):
    # Use the pre-trained model (`text_clf`) to make the prediction
    prediction = text_clf.predict([text])
    # Return the classification result: "spam" or "not spam"
    return f"The message: '{text}' is classified as: '{prediction[0]}'"

# Create the Gradio interface
iface = gr.Interface(
    fn=predict_sms,  # Function to run on input
    inputs=gr.Textbox(lines=2, label="Enter SMS Text"),  # Input textbox with a label
    outputs=gr.Textbox(label="Prediction"),  # Output textbox with a label
    title="SMS Spam Detector",  # Title of the application
    description="Enter an SMS text message to predict whether it's spam or not!"
)

# Launch the Gradio app
iface.launch()


Prediction for text_1: ham
Prediction for text_2: ham
Prediction for text_3: spam
Prediction for text_4: spam
Running on local URL:  http://127.0.0.1:7861

To create a public link, set `share=True` in `launch()`.




In [None]:
# Create a sms_app that takes a textbox for the inputs and has a textbox for the output.  
# Povide labels for each textbox. 
# Create some random text messages. 
text_1 = """You are a lucky winner of $5000!!"""
text_2 = """You won 2 free tickets to the Super Bowl."""
text_3 = """You won 2 free tickets to the Super Bowl text us to claim your prize"""
text_4 = """Thanks for registering. Text 4343 to receive free updates on medicare"""

print(text_clf.predict([text_1]))
print(text_clf.predict([text_2]))
print(text_clf.predict([text_3]))
print(text_clf.predict([text_4]))
# Launch the app.
iface.launch()
sms_app()


['ham']
['ham']
['spam']
['spam']
Rerunning server... use `close()` to stop if you need to change `launch()` parameters.
----

To create a public link, set `share=True` in `launch()`.


Running on local URL:  http://127.0.0.1:7862

To create a public link, set `share=True` in `launch()`.


## Test the following text messages. 

---

1. You are a lucky winner of $5000!
2. You won 2 free tickets to the Super Bowl.
3. You won 2 free tickets to the Super Bowl text us to claim your prize.
4. Thanks for registering. Text 4343 to receive free updates on medicare.