# Industry Sprint - The Six ⁶𓅓 (Team 9)

### Exploratory Data Analysis (EDA)

In [3]:
import pandas as pd
import plotly.express as px

# Trust percentages broken down by age band (one list entry per band).
data_age = {
    "Age Group": ["18-34", "35-54", "55+"],
    "Trust": [77, 81, 89],
    "Do not trust": [23, 0, 8],
    "Don't know": [0, 19, 3],
}

# The same three answers broken down by gender.
data_gender = {
    "Gender": ["Female", "Male"],
    "Trust": [87, 88],
    "Do not trust": [9, 7],
    "Don't know": [4, 5],
}

# Wide tables: one row per demographic group, one column per answer.
df_age = pd.DataFrame(data_age)
df_gender = pd.DataFrame(data_gender)

# Long format: one row per (group, answer) pair, which is what
# Plotly Express needs to colour the bars by answer.
df_age_melted = pd.melt(
    df_age,
    id_vars="Age Group",
    var_name="Trust Level",
    value_name="Percentage",
)
df_gender_melted = pd.melt(
    df_gender,
    id_vars="Gender",
    var_name="Trust Level",
    value_name="Percentage",
)

# Grouped (side-by-side) bars: barmode='group' places the answers next to
# each other within every age band instead of stacking them.
fig_age = px.bar(
    df_age_melted,
    x="Age Group",
    y="Percentage",
    color="Trust Level",
    barmode="group",
    title="Trust in Public Organizations by Age Group",
    labels={
        "Percentage": "Percentage (%)",
        "Age Group": "Age Group",
        "Trust Level": "Trust Level",
    },
)

fig_gender = px.bar(
    df_gender_melted,
    x="Gender",
    y="Percentage",
    color="Trust Level",
    barmode="group",
    title="Trust in Public Organizations by Gender",
    labels={
        "Percentage": "Percentage (%)",
        "Gender": "Gender",
        "Trust Level": "Trust Level",
    },
)

# Render the age chart first, then the gender chart.
fig_age.show()
fig_gender.show()


In [5]:
import pandas as pd
import plotly.graph_objects as go

# One column per statement; each list holds the percentage for the
# age bands listed under 'Age Group', in the same order.
data = {
    "Age Group": ["18-34", "35-54", "55-69", "70+"],
    "I feel more comfortable shopping in person than online": [77, 100, 84, 86],
    "I usually get help from family and friends when it comes to using the internet": [100, 84, 75, 56],
    "I find using online devices such as smartphones difficult": [49, 39, 73, 70],
    "I don't tend to use email": [48, 46, 67, 77],
    "I don't feel comfortable doing tasks such as online banking": [100, 90, 71, 46],
}

# Wide table: rows are age bands, columns are statements.
df = pd.DataFrame(data)

# The age bands form the shared x-axis of every trace.
x = df["Age Group"]

# Build one bar trace per statement column (the first column is the
# age band itself, so it is skipped).
traces = []
for column in df.columns[1:]:
    trace = go.Bar(x=x, y=df[column], name=column)
    traces.append(trace)

# Grouped layout: the statement bars sit side by side within each age band.
layout = go.Layout(
    title="Comparison of Responses by Age Group",
    xaxis={"title": "Age Group"},
    yaxis={"title": "Percentage"},
    barmode="group",
)

# Assemble the figure from the traces and layout, then render it.
fig = go.Figure(data=traces, layout=layout)
fig.show()

In [17]:
import pandas as pd
import plotly.express as px
# This cell builds its figure with graph_objects (go.Bar / go.Layout /
# go.Figure). Importing it here keeps the cell runnable on its own instead
# of relying on an earlier cell having imported `go`.
import plotly.graph_objects as go

# One column per statement; each list holds the percentage for
# Female and Male, in that order.
data = {
    'Gender': ['Female', 'Male'],
    'I feel more comfortable shopping in person than online': [88, 84],
    'I usually get help from family and friends when it comes to using the internet': [74, 65],
    'I find using online devices such as smartphones difficult': [68, 69],
    "I don't tend to use email": [63, 73],
    "I don't feel comfortable doing tasks such as online banking": [69, 61]
}

# Wide table: rows are genders, columns are statements.
df = pd.DataFrame(data)

# Gender is the shared x-axis of every trace.
x = df['Gender']

# Create one bar trace per statement column (the first column is the
# gender label itself, so it is skipped).
traces = []
for column in df.columns[1:]:
    trace = go.Bar(
        x=x,
        y=df[column],
        name=column,
    )
    traces.append(trace)

# Grouped layout: the statement bars sit side by side for each gender.
layout = go.Layout(
    title='Comparison of Responses by Gender',
    xaxis=dict(title='Gender'),
    yaxis=dict(title='Percentage'),
    barmode='group',
)

# Create the figure
fig = go.Figure(data=traces, layout=layout)

# Show the plot
fig.show()



In [20]:
import pandas as pd
import plotly.express as px

# Agreement-scale percentages by age band.
data_age = {
    "Age Group": ["18-34", "35-54", "55+"],
    "Strongly agree": [23, 29, 52],
    "Agree": [25, 17, 19],
    "Neither agree nor disagree": [0, 0, 2],
    "Disagree": [25, 14, 12],
    "Strongly disagree": [27, 40, 15],
}

# Agreement-scale percentages by gender.
data_gender = {
    "Gender": ["Female", "Male"],
    "Strongly agree": [46, 52],
    "Agree": [17, 21],
    "Neither agree nor disagree": [2, 1],
    "Disagree": [11, 15],
    "Strongly disagree": [24, 10],
}

# Wide tables: one row per group, one column per agreement level.
df_age = pd.DataFrame(data_age)
df_gender = pd.DataFrame(data_gender)

# Long format: one row per (group, agreement level) pair for plotting.
df_age_melted = pd.melt(
    df_age,
    id_vars="Age Group",
    var_name="Response",
    value_name="Percentage",
)
df_gender_melted = pd.melt(
    df_gender,
    id_vars="Gender",
    var_name="Response",
    value_name="Percentage",
)

# Grouped bars by age band, coloured by agreement level.
fig_age = px.bar(
    df_age_melted,
    x="Age Group",
    y="Percentage",
    color="Response",
    barmode="group",
    title='Agreement with "I don\'t tend to use email" by Age Group',
    labels={"Percentage": "Percentage", "Response": "Agreement"},
)

# Grouped bars by gender, coloured by agreement level.
fig_gender = px.bar(
    df_gender_melted,
    x="Gender",
    y="Percentage",
    color="Response",
    barmode="group",
    title='Agreement with "I don\'t tend to use email" by Gender',
    labels={"Percentage": "Percentage", "Response": "Agreement"},
)

# Render the two figures one after the other (two separate outputs).
fig_age.show()
fig_gender.show()


In [21]:
import pandas as pd
import plotly.express as px

# Agreement-scale percentages by age band, including the
# "Don't do this online activity" answer.
data = {
    "Age (groups)": ["18-34", "35-54", "55-69", "70+"],
    "Strongly agree": [75, 55, 52, 41],
    "Agree": [25, 29, 23, 14],
    "Neither agree nor disagree": [0, 0, 1, 3],
    "Disagree": [0, 0, 7, 3],
    "Strongly disagree": [0, 2, 12, 12],
    "Don't do this online activity": [0, 0, 4, 19],
}

# Wide table: one row per age band.
df = pd.DataFrame(data)

# Long format: one row per (age band, response) pair.
df_melted = pd.melt(
    df,
    id_vars="Age (groups)",
    var_name="Response",
    value_name="Percentage",
)

# Grouped bars by age band, coloured by response.
fig = px.bar(
    df_melted,
    x="Age (groups)",
    y="Percentage",
    color="Response",
    barmode="group",
    title="Agreement with Internet Use Statements by Age Group",
    labels={
        "Percentage": "Percentage (%)",
        "Age (groups)": "Age Group",
        "Response": "Agreement",
    },
)

fig.show()


# The same response scale, broken down by gender.
data_gender = {
    "Gender": ["Female", "Male"],
    "Strongly agree": [52, 46],
    "Agree": [22, 19],
    "Neither agree nor disagree": [1, 2],
    "Disagree": [5, 2],
    "Strongly disagree": [9, 14],
    "Don't do this online activity": [8, 10],
}

# Wide table: one row per gender.
df_gender = pd.DataFrame(data_gender)

# Long format: one row per (gender, response) pair.
df_gender_melted = pd.melt(
    df_gender,
    id_vars="Gender",
    var_name="Response",
    value_name="Percentage",
)

# Grouped bars by gender, coloured by response.
fig_gender = px.bar(
    df_gender_melted,
    x="Gender",
    y="Percentage",
    color="Response",
    barmode="group",
    title="Agreement with Internet Use Statements by Gender",
    labels={
        "Percentage": "Percentage (%)",
        "Gender": "Gender",
        "Response": "Agreement",
    },
)

fig_gender.show()


In [22]:
import pandas as pd
import plotly.express as px

# Agreement-scale percentages by age band, including the
# "Don't do this online activity" and "Don't know" answers.
data = {
    "Age (groups)": ["18-34", "35-54", "55-69", "70+"],
    "Strongly agree": [0, 32, 49, 57],
    "Agree": [49, 7, 24, 13],
    "Neither agree nor disagree": [0, 7, 1, 1],
    "Disagree": [0, 26, 5, 0],
    "Strongly disagree": [51, 14, 11, 10],
    "Don't do this online activity": [0, 0, 7, 13],
    "Don't know": [0, 14, 4, 7],
}

# Wide table: one row per age band.
df = pd.DataFrame(data)

# Long format: one row per (age band, response) pair.
df_melted = pd.melt(
    df,
    id_vars="Age (groups)",
    var_name="Response",
    value_name="Percentage",
)

# Grouped bars by age band, coloured by response.
fig = px.bar(
    df_melted,
    x="Age (groups)",
    y="Percentage",
    color="Response",
    barmode="group",
    title='Agreement with "I find using online devices such as smartphones difficult" by Age Group',
    labels={
        "Percentage": "Percentage (%)",
        "Age (groups)": "Age Group",
        "Response": "Agreement",
    },
)

fig.show()


# The same response scale, broken down by gender.
data_gender = {
    "Gender": ["Female", "Male"],
    "Strongly agree": [47, 49],
    "Agree": [21, 20],
    "Neither agree nor disagree": [1, 2],
    "Disagree": [6, 2],
    "Strongly disagree": [12, 13],
    "Don't do this online activity": [8, 8],
    "Don't know": [5, 6],
}

# Wide table: one row per gender.
df_gender = pd.DataFrame(data_gender)

# Long format: one row per (gender, response) pair.
df_gender_melted = pd.melt(
    df_gender,
    id_vars="Gender",
    var_name="Response",
    value_name="Percentage",
)

# Grouped bars by gender, coloured by response.
fig_gender = px.bar(
    df_gender_melted,
    x="Gender",
    y="Percentage",
    color="Response",
    barmode="group",
    title='Agreement with "I find using online devices such as smartphones difficult" by Gender',
    labels={
        "Percentage": "Percentage (%)",
        "Gender": "Gender",
        "Response": "Agreement",
    },
)

fig_gender.show()

In [32]:
import pandas as pd
import plotly.express as px

# Responses by age band. 'Total' is not a response percentage (the gender
# table below holds values above 100 in that column); it looks like the
# number of respondents per group — TODO confirm against the source tables.
data = {
    'Age (groups)': ['18-34', '35-54',  '55-69', '70+'],
    'Total': [12, 17, 93, 72],
    'Strongly agree': [52, 98, 64, 78],
    'Agree': [25, 2, 21, 7],
    'Neither agree nor disagree': [0, 0, 2, 0],
    'Disagree': [23, 0, 2, 3],
    'Strongly disagree': [0, 0, 7, 1],
    "Don't do this online activity": [0, 0, 5, 6],
    "Don't know": [0, 0, 1, 4],
}

# Wide table: one row per age band ('Total' is kept here for reference).
df = pd.DataFrame(data)

# Melt to long format. 'Total' is dropped first so it is not plotted as
# if it were one of the response percentages.
df_melted = df.drop(columns='Total').melt(
    id_vars='Age (groups)', var_name='Response', value_name='Percentage')

# Plot the grouped bar chart using Plotly Express
fig = px.bar(df_melted, x='Age (groups)', y='Percentage', color='Response',  barmode='group',
             title='Agreement with "I feel more comfortable shopping in person than online" by Age Group',
             labels={'Percentage': 'Percentage (%)', 'Age (groups)': 'Age Group', 'Response': 'Agreement'})

# Show the plot
fig.show()

# Responses by gender; 'Total' has the same role as in the age table above.
data_gender = {
    'Gender': ['Female', 'Male'],
    'Total': [121, 77],
    'Strongly agree': [78, 70],
    'Agree': [18, 10],
    'Neither agree nor disagree': [1, 1],
    'Disagree': [3, 8],
    'Strongly disagree': [5, 2],
    "Don't do this online activity": [5, 4],
    "Don't know": [1, 2],
}

# Wide table: one row per gender ('Total' is kept here for reference).
df_gender = pd.DataFrame(data_gender)

# Melt to long format, again leaving 'Total' out of the plotted series.
df_gender_melted = df_gender.drop(columns='Total').melt(
    id_vars='Gender', var_name='Response', value_name='Percentage')

# Plot the grouped bar chart using Plotly Express
fig_gender = px.bar(df_gender_melted, x='Gender', y='Percentage', color='Response', barmode='group',
                    title='Agreement with "I feel more comfortable shopping in person than online" by Gender',
                    labels={'Percentage': 'Percentage (%)', 'Gender': 'Gender', 'Response': 'Agreement'})

# Show the plot
fig_gender.show()


In [31]:
import pandas as pd
import plotly.express as px

# Percentage choosing each view, by age band. The full answer wording is
# used as the column name, so it also becomes the legend text.
data = {
    "Age (groups)": ["18-34", "35-54", "55-69", "70+"],
    "I would rather not provide data about the region I live in, even if it means the system could not be checked to see if it's unfair to people from different groups": [0, 0, 27, 27],
    "I would rather the system be checked to see if it is unfair for different groups, and would be comfortable with sharing information about the region I live in to enable that": [0, 36, 63, 47],
    "Don't know": [0, 64, 9, 26],
}

# Wide table: one row per age band.
df = pd.DataFrame(data)

# Long format: one row per (age band, view) pair.
df_melted = pd.melt(
    df,
    id_vars="Age (groups)",
    var_name="Response",
    value_name="Percentage",
)

# Grouped bars by age band, coloured by view.
fig = px.bar(
    df_melted,
    x="Age (groups)",
    y="Percentage",
    color="Response",
    barmode="group",
    title="Views on Providing Region Data for Checking Unfair System Outcomes by Age Group",
    labels={
        "Percentage": "Percentage (%)",
        "Age (groups)": "Age Group",
        "Response": "View",
    },
)

fig.show()

# The same views, broken down by gender.
data_gender = {
    "Gender": ["Female", "Male"],
    "I would rather not provide data about the region I live in, even if it means the system could not be checked to see if it's unfair to people from different groups": [26, 24],
    "I would rather the system be checked to see if it is unfair for different groups, and would be comfortable with sharing information about the region I live in to enable that": [53, 62],
    "Don't know": [21, 14],
}

# Wide table: one row per gender.
df_gender = pd.DataFrame(data_gender)

# Long format: one row per (gender, view) pair.
df_gender_melted = pd.melt(
    df_gender,
    id_vars="Gender",
    var_name="Response",
    value_name="Percentage",
)

# Grouped bars by gender, coloured by view.
fig_gender = px.bar(
    df_gender_melted,
    x="Gender",
    y="Percentage",
    color="Response",
    barmode="group",
    title="Views on Providing Region Data for Checking Unfair System Outcomes by Gender",
    labels={
        "Percentage": "Percentage (%)",
        "Gender": "Gender",
        "Response": "View",
    },
)

fig_gender.show()

In [35]:
import pandas as pd
import plotly.express as px

# Rating percentages by age band only. The Female/Male figures are kept
# out of this table: they are not age groups and are plotted in their own
# "by Gender" chart below, so including them here would put gender
# categories on an axis labelled "Age Group".
data = {
    'Age (groups)': ['18-34', '35-54', '55-69', '70+'],
    'Very negative': [0, 0, 5, 2],
    'Slightly negative': [0, 0, 8, 6],
    'Neither positive nor negative': [0, 65, 3, 24],
    'Slightly positive': [0, 18, 40, 17],
    'Very positive': [0, 17, 44, 51],
}

# Wide table: one row per age band.
df = pd.DataFrame(data)

# Melt the DataFrame to convert it to long format
df_melted = df.melt(id_vars='Age (groups)', var_name='Response', value_name='Percentage')

# Plot the grouped bar chart using Plotly Express
fig = px.bar(df_melted, x='Age (groups)', y='Percentage', color='Response', barmode='group',
             title='Impact of Artificial Intelligence on Healthcare by Age Group',
             labels={'Percentage': 'Percentage (%)', 'Age (groups)': 'Age Group', 'Response': 'Impact'})

# Show the plot
fig.show()

# Rating percentages by gender.
data_gender = {
    'Gender': ['Female', 'Male'],
    'Very negative': [6, 1],
    'Slightly negative': [12, 2],
    'Neither positive nor negative': [25, 11],
    'Slightly positive': [21, 41],
    'Very positive': [37, 46],
}

# Wide table: one row per gender.
df_gender = pd.DataFrame(data_gender)

# Melt the DataFrame to convert it to long format
df_gender_melted = df_gender.melt(id_vars='Gender', var_name='Response', value_name='Percentage')

# Plot the grouped bar chart using Plotly Express
fig_gender = px.bar(df_gender_melted, x='Gender', y='Percentage', color='Response', barmode='group',
                    title='Impact of Artificial Intelligence on Healthcare by Gender',
                    labels={'Percentage': 'Percentage (%)', 'Gender': 'Gender', 'Response': 'Impact'})

# Show the plot
fig_gender.show()


In [38]:
import pandas as pd
import plotly.express as px

# Awareness percentages per demographic group. The 'Age (groups)' column
# holds the four age bands followed by the two gender groups, so the chart
# shows both breakdowns on one axis.
data = {
    'Age (groups)': ['18-34', '35-54', '55-69', '70+', 'Female', 'Male'],
    'NET: Heard of': [75, 69, 65, 59, 60, 71],
    'NET: Could explain at least partially': [0, 43, 33, 23, 22, 37],
}

# Wide table: one row per demographic group.
df = pd.DataFrame(data)

# Melt the DataFrame to convert it to long format
df_melted = df.melt(id_vars='Age (groups)', var_name='Response', value_name='Percentage')

# Plot the grouped bar chart using Plotly Express. The x-axis is labelled
# 'Demographic Group' rather than 'Age Group' because its categories
# include Female and Male as well as the age bands.
fig = px.bar(df_melted, x='Age (groups)', y='Percentage', color='Response', barmode='group',
             title='Awareness and Understanding of Artificial Intelligence (AI)',
             labels={'Percentage': 'Percentage (%)', 'Age (groups)': 'Demographic Group', 'Response': 'Response'})

# Show the plot
fig.show()


In [53]:
import pandas as pd
import plotly.express as px

# Percentage rating each situation as neutral, positive or negative.
data = {
    "Situations": [
        "Everyday Effortlessness",
        "Personalized Healthcare",
        "Job opportunities",
        "Cutting Costs with Ease",
        "Assessing Fairness in Society",
    ],
    "Neither positive nor negative (3.0)": [14, 17, 18, 25, 16],
    "Positive": [77, 73, 52, 48, 37],
    "Negative": [8, 10, 30, 25, 43],
}

# Wide table: one row per situation.
df = pd.DataFrame(data)

# Long format: one row per (situation, rating) pair.
df_melted = pd.melt(
    df,
    id_vars="Situations",
    var_name="Response",
    value_name="Percentage",
)

# Grouped bars by situation, coloured by rating.
fig = px.bar(
    df_melted,
    x="Situations",
    y="Percentage",
    color="Response",
    barmode="group",
    title="Perceived Impact of Artificial Intelligence (AI) for Different Situations",
    labels={
        "Percentage": "Percentage (%)",
        "Situations": "Situations",
        "Response": "Impact Level",
    },
)

fig.show()


In [44]:
import pandas as pd
import plotly.express as px

# Percentage of answers at each rating value, one column per question.
# NOTE(review): the 'Rating' list has no entries for 1 and 3, and the
# social-media series is all zeros — presumably missing or placeholder
# data; confirm against the source tables.
data = {
    "Rating": [0, 2, 4, 5, 6, 7, 8, 9, 10],
    "Knowledge about how data is used and collected in day-to-day life": [4, 2, 0, 22, 20, 9, 28, 12, 4],
    "Read, seen or heard anything about data being used in P6M": [0, 1, 9, 27, 26, 15, 14, 0, 5],
    "Awareness of AI": [2, 2, 8, 24, 20, 12, 22, 5, 6],
    "Trust social media companies to act in best interest": [0, 0, 0, 0, 0, 0, 0, 0, 0],
    "Trust big technology companies to act in best interest": [2, 2, 9, 28, 24, 15, 12, 5, 13],
}

# Wide table: one row per rating value.
df = pd.DataFrame(data)

# Long format: one row per (rating, question) pair.
df_melted = pd.melt(
    df,
    id_vars="Rating",
    var_name="Category",
    value_name="Percentage",
)

# Scatter of percentage against rating, one colour per question.
# NOTE(review): the title and legend label talk about "impact", while the
# columns are knowledge/awareness/trust questions — confirm the wording.
fig = px.scatter(
    df_melted,
    x="Rating",
    y="Percentage",
    color="Category",
    labels={
        "Percentage": "Percentage (%)",
        "Rating": "Rating (0-10)",
        "Category": "Category of Impact",
    },
    title="Impact of Artificial Intelligence (AI) on Different Categories of Society",
)

fig.show()


In [52]:
import pandas as pd
import plotly.express as px

# Percentage of answers at each rating value for two questions.
data = {
    "Rating": [0, 2, 4, 5, 6, 7, 8, 9, 10],
    "Awareness of AI": [2, 2, 8, 24, 20, 12, 22, 5, 6],
    "Trust big technology companies to act in best interest": [2, 2, 9, 28, 24, 15, 12, 5, 13],
}

# Wide table: one row per rating value.
df = pd.DataFrame(data)

# Long format: one row per (rating, question) pair.
df_melted = pd.melt(
    df,
    id_vars="Rating",
    var_name="Category",
    value_name="Percentage",
)

# Grouped bars: the two questions sit side by side at every rating value.
fig = px.bar(
    df_melted,
    x="Rating",
    y="Percentage",
    color="Category",
    barmode="group",
    labels={
        "Percentage": "Percentage (%)",
        "Rating": "Rating (0-10)",
        "Category": "Category of Impact",
    },
    title="Awareness of Artificial Intelligence (AI) on Trust in Big Companies",
)

fig.show()


In [49]:
import pandas as pd
import plotly.express as px

# Two values per question.
# NOTE(review): nothing in this cell says what the first and second value
# of each pair represent (there is no id/label column) — confirm and
# consider adding one so the two bars can be told apart.
data = {
    "Knowledge about how data is used and collected in day-to-day life": [80, 10],
    "Read, seen or heard anything about data being used in P6M": [69, 9],
    "Awareness of AI": [76, 5],
    "Trust social media companies to act in best interest": [62, 27],
    "Trust big technology companies to act in best interest": [73, 10],
}

# Wide table: two rows, one column per question.
df = pd.DataFrame(data)

# Long format: with no id column, every column is melted, giving two
# rows per question.
df_melted = pd.melt(df, var_name="Category", value_name="Percentage")

# Bars per question, coloured by question.
# NOTE(review): the title refers to healthcare impact, while the columns
# are knowledge/awareness/trust questions — confirm the intended title.
fig = px.bar(
    df_melted,
    x="Category",
    y="Percentage",
    color="Category",
    barmode="group",
    labels={"Percentage": "Percentage (%)", "Category": "Category of Impact"},
    title="Impact of Artificial Intelligence (AI) on Healthcare for People Like You and Your Family",
)

fig.show()
