<a href="https://colab.research.google.com/github/GEOFFREY-MO/My-data/blob/main/realapp.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [None]:
import pandas as pd
import numpy as np
import plotly.express as px
import streamlit as st

def _strongest_pair(correlation_matrix):
    """Return the most strongly correlated pair of distinct columns.

    Only the strict upper triangle of the matrix is examined, so the
    diagonal (each column against itself) and the mirrored duplicates below
    it are ignored. Strength is judged by absolute value, so a strong
    negative correlation can win over a weaker positive one.

    Args:
        correlation_matrix: Square DataFrame of pairwise correlation
            coefficients, as produced by ``DataFrame.corr()``.

    Returns:
        A ``(first_column, second_column, coefficient)`` tuple, or ``None``
        when there are fewer than two columns or every pairwise
        coefficient is NaN.
    """
    labels = list(correlation_matrix.columns)
    if len(labels) < 2:
        return None

    values = correlation_matrix.to_numpy(dtype=float)
    rows, cols = np.triu_indices(len(labels), k=1)
    coefficients = values[rows, cols]
    # nanargmax raises on an all-NaN input (e.g. every column is constant).
    if np.isnan(coefficients).all():
        return None

    best = int(np.nanargmax(np.abs(coefficients)))
    return labels[rows[best]], labels[cols[best]], float(coefficients[best])


def data_analysis(data_path):
    """Load a CSV dataset and render an exploratory report in Streamlit.

    The report shows per-column missing-value counts, descriptive
    statistics, the correlation matrix of the numeric columns, a comment on
    the strongest pairwise correlation, and an interactive scatter plot of
    two user-selected columns.

    Args:
        data_path: Anything ``pandas.read_csv`` accepts, i.e. a filesystem
            path or an open file-like object.
    """
    # Load the dataset
    data = pd.read_csv(data_path)

    # Check for missing values. The Series is written on its own so that
    # Streamlit renders it as a table instead of collapsed Markdown text.
    st.write("Missing values:")
    st.write(data.isnull().sum())

    # Descriptive statistics
    st.write("Descriptive statistics:")
    st.write(data.describe())

    # Correlation analysis. Restrict to numeric columns first: recent pandas
    # versions raise when corr() meets text columns.
    correlation_matrix = data.select_dtypes(include="number").corr()
    st.write("Correlation matrix:")
    st.write(correlation_matrix)

    # Find the strongest correlation between two *different* columns
    strongest = _strongest_pair(correlation_matrix)
    if strongest is None:
        st.write("At least two numeric columns with varying values are needed to compute a correlation.")
    else:
        first_column, second_column, coefficient = strongest
        st.write(f"Strongest correlation: {coefficient:.3f} between {first_column} and {second_column}")

        # Make comments about the data
        if coefficient > 0.7:
            st.write("There is a strong positive correlation between the variables. This means that they tend to move in the same direction.")
        elif coefficient < -0.7:
            st.write("There is a strong negative correlation between the variables. This means that they tend to move in opposite directions.")
        else:
            st.write("There is a weak correlation between the variables. This means that they do not tend to move in the same direction.")

    # Select the variables to plot
    x_variable = st.selectbox("X-axis variable", data.columns)
    y_variable = st.selectbox("Y-axis variable", data.columns)

    # Create the scatter plot
    fig = px.scatter(data, x=x_variable, y=y_variable)

    # Display the plot in Streamlit
    st.plotly_chart(fig)
# Streamlit entry point: render the page title, ask for a dataset, and run
# the analysis once a file has been provided.
st.title("Data Analysis App")

# Upload the dataset
uploaded_file = st.file_uploader("Choose a dataset file")

# If a dataset is uploaded, perform the data analysis
if uploaded_file is not None:
    # Pass the uploaded file object itself rather than its name: the upload
    # is held in memory, so a file with that name does not necessarily exist
    # on the server's disk. pandas.read_csv accepts file-like objects.
    data_analysis(uploaded_file)
else:
    st.write("Please upload a dataset file to perform the data analysis.")