# **departments**

In [3]:
#Food and Beverages Domestic
import pandas as pd
from scipy import stats

# Load the review dataset that every analysis cell in this notebook reads via `data`.
# The cells below use its 'Airline Name' and 'flight_type' columns plus one rating
# column per section (e.g. 'Food & Beverages', 'Seat Comfort').
# NOTE(review): '/content/...' looks like a Colab-local path — confirm the file is
# present before running on a fresh runtime.
data = pd.read_csv('/content/statdata.csv')

# Airlines whose domestic 'Food & Beverages' ratings are compared with all other
# domestic rows. Each entry is used as a case-insensitive substring pattern.
airlines = ['Avianca', 'Spirit Airlines', 'LAN Airlines']

# Per-airline results, keyed by the search term above
t_test_results = {}

# Loop-invariant mask: rows that belong to domestic flights
is_domestic = data['flight_type'] == 'Domestic'

for airline in airlines:
    # Rows whose airline name contains the search term. Missing names never
    # match (na=False), so they end up in the "other airlines" group.
    is_airline = data['Airline Name'].str.contains(airline, case=False, na=False)

    # This airline's domestic rows
    airline_filter = is_airline & is_domestic
    airline_data = data[airline_filter]
    airline_avg_sentiment = airline_data['Food & Beverages'].mean()
    airline_obs = len(airline_data)

    # Every other domestic row
    other_airlines_filter = ~is_airline & is_domestic
    other_airlines_data = data[other_airlines_filter]
    other_airlines_avg_sentiment = other_airlines_data['Food & Beverages'].mean()
    other_airlines_observations = len(other_airlines_data)

    # Welch's t-test: equal_var=False means the groups are not assumed to share
    # a variance. p_value is two-sided.
    t_stat, p_value = stats.ttest_ind(airline_data['Food & Beverages'],
                                      other_airlines_data['Food & Beverages'],
                                      equal_var=False)

    # One-tailed p-value for H1 "this airline's mean is LOWER than the others'".
    # Halving the two-sided value is only valid when the statistic lies on the
    # hypothesised (negative) side; otherwise the lower-tail area is 1 - p/2.
    if t_stat < 0:
        one_tail_p_value = p_value / 2
    else:
        one_tail_p_value = 1 - p_value / 2

    # Store results in the dictionary
    t_test_results[airline] = {
        't_stat': t_stat,
        'p_value': p_value,
        'one_tail_p_value': one_tail_p_value,
        'airline_obs': airline_obs,
        'other_airlines_observations': other_airlines_observations,
        'airline_avg_sentiment': airline_avg_sentiment,
        'other_airlines_avg_sentiment': other_airlines_avg_sentiment
    }

# Print one report per airline
for airline, results in t_test_results.items():
    print(f"Results for {airline}:")
    print(f"Observations: {results['airline_obs']}")
    print(f"Average Sentiment: {results['airline_avg_sentiment']}")
    print(f"Other Airlines Observations: {results['other_airlines_observations']}")
    print(f"Other Airlines Average Sentiment: {results['other_airlines_avg_sentiment']}")
    print(f"T-Statistic: {results['t_stat']}")
    print(f"P-Value: {results['p_value']}")
    print(f"One-Tail P-Value: {results['one_tail_p_value']}")
    print("\n")  # Blank lines between airlines

Results for Avianca:
Observations: 3
Average Sentiment: 1.6666666666666667
Other Airlines Observations: 1216
Other Airlines Average Sentiment: 2.3963815789473686
T-Statistic: -1.0931806874417027
P-Value: 0.3879261444713149
One-Tail P-Value: 0.19396307223565745


Results for Spirit Airlines:
Observations: 86
Average Sentiment: 1.941860465116279
Other Airlines Observations: 1133
Other Airlines Average Sentiment: 2.4289496910856134
T-Statistic: -4.214248363762742
P-Value: 5.3905756352200393e-05
One-Tail P-Value: 2.6952878176100197e-05


Results for LAN Airlines:
Observations: 3
Average Sentiment: 1.3333333333333333
Other Airlines Observations: 1216
Other Airlines Average Sentiment: 2.3972039473684212
T-Statistic: -3.1754703628292607
P-Value: 0.08426111198043293
One-Tail P-Value: 0.042130555990216464




In [4]:
#Food and Beverages International

# Airlines whose international 'Food & Beverages' ratings are compared with all
# other international rows. Each entry is a case-insensitive substring pattern.
airlines = ['Avianca', 'US Airways', 'Flair Airlines']

# Per-airline results, keyed by the search term above
t_test_results = {}

# Loop-invariant mask: rows that belong to international flights
is_international = data['flight_type'] == 'International'

for airline in airlines:
    # Rows whose airline name contains the search term. Missing names never
    # match (na=False), so they end up in the "other airlines" group.
    is_airline = data['Airline Name'].str.contains(airline, case=False, na=False)

    # This airline's international rows
    airline_filter = is_airline & is_international
    airline_data = data[airline_filter]
    airline_avg_sentiment = airline_data['Food & Beverages'].mean()
    airline_obs = len(airline_data)

    # Every other international row
    other_airlines_filter = ~is_airline & is_international
    other_airlines_data = data[other_airlines_filter]
    other_airlines_avg_sentiment = other_airlines_data['Food & Beverages'].mean()
    other_airlines_observations = len(other_airlines_data)

    # Welch's t-test: equal_var=False means the groups are not assumed to share
    # a variance. p_value is two-sided.
    t_stat, p_value = stats.ttest_ind(airline_data['Food & Beverages'],
                                      other_airlines_data['Food & Beverages'],
                                      equal_var=False)

    # One-tailed p-value for H1 "this airline's mean is LOWER than the others'".
    # Halving the two-sided value is only valid when the statistic lies on the
    # hypothesised (negative) side; otherwise the lower-tail area is 1 - p/2.
    if t_stat < 0:
        one_tail_p_value = p_value / 2
    else:
        one_tail_p_value = 1 - p_value / 2

    # Store results in the dictionary
    t_test_results[airline] = {
        't_stat': t_stat,
        'p_value': p_value,
        'one_tail_p_value': one_tail_p_value,
        'airline_obs': airline_obs,
        'other_airlines_observations': other_airlines_observations,
        'airline_avg_sentiment': airline_avg_sentiment,
        'other_airlines_avg_sentiment': other_airlines_avg_sentiment
    }

# Print one report per airline
for airline, results in t_test_results.items():
    print(f"Results for {airline}:")
    print(f"Observations: {results['airline_obs']}")
    print(f"Average Sentiment: {results['airline_avg_sentiment']}")
    print(f"Other Airlines Observations: {results['other_airlines_observations']}")
    print(f"Other Airlines Average Sentiment: {results['other_airlines_avg_sentiment']}")
    print(f"T-Statistic: {results['t_stat']}")
    print(f"P-Value: {results['p_value']}")
    print(f"One-Tail P-Value: {results['one_tail_p_value']}")
    print("\n")  # Blank lines between airlines

Results for Avianca:
Observations: 25
Average Sentiment: 1.6
Other Airlines Observations: 1344
Other Airlines Average Sentiment: 2.5558035714285716
T-Statistic: -5.1336872563439755
P-Value: 2.3741340551004567e-05
One-Tail P-Value: 1.1870670275502283e-05


Results for US Airways:
Observations: 10
Average Sentiment: 1.7
Other Airlines Observations: 1359
Other Airlines Average Sentiment: 2.5445180279617365
T-Statistic: -3.212813042297379
P-Value: 0.010102068704995013
One-Tail P-Value: 0.005051034352497506


Results for Flair Airlines:
Observations: 4
Average Sentiment: 1.5
Other Airlines Observations: 1365
Other Airlines Average Sentiment: 2.5413919413919412
T-Statistic: -2.077353059113774
P-Value: 0.12838437886434426
One-Tail P-Value: 0.06419218943217213




Seat Comfort

In [5]:
#Seat Comfort Domestic

# Airlines whose domestic 'Seat Comfort' ratings are compared with all other
# domestic rows. Each entry is a case-insensitive substring pattern.
airlines = ['Allegiant Air', 'Frontier Airlines', 'Spirit Airlines']

# Per-airline results, keyed by the search term above
t_test_results = {}

# Loop-invariant mask: rows that belong to domestic flights
is_domestic = data['flight_type'] == 'Domestic'

for airline in airlines:
    # Rows whose airline name contains the search term. Missing names never
    # match (na=False), so they end up in the "other airlines" group.
    is_airline = data['Airline Name'].str.contains(airline, case=False, na=False)

    # This airline's domestic rows
    airline_filter = is_airline & is_domestic
    airline_data = data[airline_filter]
    airline_avg_sentiment = airline_data['Seat Comfort'].mean()
    airline_obs = len(airline_data)

    # Every other domestic row
    other_airlines_filter = ~is_airline & is_domestic
    other_airlines_data = data[other_airlines_filter]
    other_airlines_avg_sentiment = other_airlines_data['Seat Comfort'].mean()
    other_airlines_observations = len(other_airlines_data)

    # Welch's t-test: equal_var=False means the groups are not assumed to share
    # a variance. p_value is two-sided.
    t_stat, p_value = stats.ttest_ind(airline_data['Seat Comfort'],
                                      other_airlines_data['Seat Comfort'],
                                      equal_var=False)

    # One-tailed p-value for H1 "this airline's mean is LOWER than the others'".
    # Halving the two-sided value is only valid when the statistic lies on the
    # hypothesised (negative) side; otherwise the lower-tail area is 1 - p/2.
    if t_stat < 0:
        one_tail_p_value = p_value / 2
    else:
        one_tail_p_value = 1 - p_value / 2

    # Store results in the dictionary
    t_test_results[airline] = {
        't_stat': t_stat,
        'p_value': p_value,
        'one_tail_p_value': one_tail_p_value,
        'airline_obs': airline_obs,
        'other_airlines_observations': other_airlines_observations,
        'airline_avg_sentiment': airline_avg_sentiment,
        'other_airlines_avg_sentiment': other_airlines_avg_sentiment
    }

# Print one report per airline
for airline, results in t_test_results.items():
    print(f"Results for {airline}:")
    print(f"Observations: {results['airline_obs']}")
    print(f"Average Sentiment: {results['airline_avg_sentiment']}")
    print(f"Other Airlines Observations: {results['other_airlines_observations']}")
    print(f"Other Airlines Average Sentiment: {results['other_airlines_avg_sentiment']}")
    print(f"T-Statistic: {results['t_stat']}")
    print(f"P-Value: {results['p_value']}")
    print(f"One-Tail P-Value: {results['one_tail_p_value']}")
    print("\n")  # Blank lines between airlines

Results for Allegiant Air:
Observations: 86
Average Sentiment: 1.5348837209302326
Other Airlines Observations: 1133
Other Airlines Average Sentiment: 2.2162400706090026
T-Statistic: -6.113300843909414
P-Value: 1.4863567105282974e-08
One-Tail P-Value: 7.431783552641487e-09


Results for Frontier Airlines:
Observations: 73
Average Sentiment: 1.547945205479452
Other Airlines Observations: 1146
Other Airlines Average Sentiment: 2.2076788830715532
T-Statistic: -6.0630345267067804
P-Value: 2.6800052032011978e-08
One-Tail P-Value: 1.3400026016005989e-08


Results for Spirit Airlines:
Observations: 86
Average Sentiment: 1.6511627906976745
Other Airlines Observations: 1133
Other Airlines Average Sentiment: 2.207413945278023
T-Statistic: -4.599301515183189
P-Value: 1.174736234095787e-05
One-Tail P-Value: 5.873681170478935e-06




In [6]:
#Seat Comfort  International

# Airlines whose international 'Seat Comfort' ratings are compared with all
# other international rows. Each entry is a case-insensitive substring pattern.
airlines = ['Frontier', 'Jetblue', 'Jetstar']

# Per-airline results, keyed by the search term above
t_test_results = {}

# Loop-invariant mask: rows that belong to international flights
is_international = data['flight_type'] == 'International'

for airline in airlines:
    # Rows whose airline name contains the search term. Missing names never
    # match (na=False), so they end up in the "other airlines" group.
    is_airline = data['Airline Name'].str.contains(airline, case=False, na=False)

    # This airline's international rows
    airline_filter = is_airline & is_international
    airline_data = data[airline_filter]
    airline_avg_sentiment = airline_data['Seat Comfort'].mean()
    airline_obs = len(airline_data)

    # Every other international row
    other_airlines_filter = ~is_airline & is_international
    other_airlines_data = data[other_airlines_filter]
    other_airlines_avg_sentiment = other_airlines_data['Seat Comfort'].mean()
    other_airlines_observations = len(other_airlines_data)

    # Welch's t-test: equal_var=False means the groups are not assumed to share
    # a variance. p_value is two-sided.
    t_stat, p_value = stats.ttest_ind(airline_data['Seat Comfort'],
                                      other_airlines_data['Seat Comfort'],
                                      equal_var=False)

    # One-tailed p-value for H1 "this airline's mean is LOWER than the others'".
    # Halving the two-sided value is only valid when the statistic lies on the
    # hypothesised (negative) side; otherwise the lower-tail area is 1 - p/2.
    if t_stat < 0:
        one_tail_p_value = p_value / 2
    else:
        one_tail_p_value = 1 - p_value / 2

    # Store results in the dictionary
    t_test_results[airline] = {
        't_stat': t_stat,
        'p_value': p_value,
        'one_tail_p_value': one_tail_p_value,
        'airline_obs': airline_obs,
        'other_airlines_observations': other_airlines_observations,
        'airline_avg_sentiment': airline_avg_sentiment,
        'other_airlines_avg_sentiment': other_airlines_avg_sentiment
    }

# Print one report per airline
for airline, results in t_test_results.items():
    print(f"Results for {airline}:")
    print(f"Observations: {results['airline_obs']}")
    print(f"Average Sentiment: {results['airline_avg_sentiment']}")
    print(f"Other Airlines Observations: {results['other_airlines_observations']}")
    print(f"Other Airlines Average Sentiment: {results['other_airlines_avg_sentiment']}")
    print(f"T-Statistic: {results['t_stat']}")
    print(f"P-Value: {results['p_value']}")
    print(f"One-Tail P-Value: {results['one_tail_p_value']}")
    print("\n")  # Blank lines between airlines

Results for Frontier:
Observations: 8
Average Sentiment: 1.0
Other Airlines Observations: 1361
Other Airlines Average Sentiment: 2.46069066862601
T-Statistic: -39.36810738361101
P-Value: 7.018843395815594e-227
One-Tail P-Value: 3.509421697907797e-227


Results for Jetblue:
Observations: 12
Average Sentiment: 2.25
Other Airlines Observations: 1357
Other Airlines Average Sentiment: 2.453942520265291
T-Statistic: -0.4740379918677167
P-Value: 0.6446071327302156
One-Tail P-Value: 0.3223035663651078


Results for Jetstar:
Observations: 3
Average Sentiment: 1.0
Other Airlines Observations: 1366
Other Airlines Average Sentiment: 2.4553440702781844
T-Statistic: -39.286308509050016
P-Value: 1.7957953580557512e-226
One-Tail P-Value: 8.978976790278756e-227




  res = hypotest_fun_out(*samples, **kwds)


Inflight Entertainment

In [7]:
#Inflight Entertainment Domestic

# Airlines whose domestic 'Inflight Entertainment' ratings are compared with all
# other domestic rows. Each entry is a case-insensitive substring pattern.
airlines = ['Avianca', 'Spirit Airlines', 'US Airways']

# Per-airline results, keyed by the search term above
t_test_results = {}

# Loop-invariant mask: rows that belong to domestic flights
is_domestic = data['flight_type'] == 'Domestic'

for airline in airlines:
    # Rows whose airline name contains the search term. Missing names never
    # match (na=False), so they end up in the "other airlines" group.
    is_airline = data['Airline Name'].str.contains(airline, case=False, na=False)

    # This airline's domestic rows
    airline_filter = is_airline & is_domestic
    airline_data = data[airline_filter]
    airline_avg_sentiment = airline_data['Inflight Entertainment'].mean()
    airline_obs = len(airline_data)

    # Every other domestic row
    other_airlines_filter = ~is_airline & is_domestic
    other_airlines_data = data[other_airlines_filter]
    other_airlines_avg_sentiment = other_airlines_data['Inflight Entertainment'].mean()
    other_airlines_observations = len(other_airlines_data)

    # Welch's t-test: equal_var=False means the groups are not assumed to share
    # a variance. p_value is two-sided.
    t_stat, p_value = stats.ttest_ind(airline_data['Inflight Entertainment'],
                                      other_airlines_data['Inflight Entertainment'],
                                      equal_var=False)

    # One-tailed p-value for H1 "this airline's mean is LOWER than the others'".
    # Halving the two-sided value is only valid when the statistic lies on the
    # hypothesised (negative) side; otherwise the lower-tail area is 1 - p/2.
    if t_stat < 0:
        one_tail_p_value = p_value / 2
    else:
        one_tail_p_value = 1 - p_value / 2

    # Store results in the dictionary
    t_test_results[airline] = {
        't_stat': t_stat,
        'p_value': p_value,
        'one_tail_p_value': one_tail_p_value,
        'airline_obs': airline_obs,
        'other_airlines_observations': other_airlines_observations,
        'airline_avg_sentiment': airline_avg_sentiment,
        'other_airlines_avg_sentiment': other_airlines_avg_sentiment
    }

# Print one report per airline
for airline, results in t_test_results.items():
    print(f"Results for {airline}:")
    print(f"Observations: {results['airline_obs']}")
    print(f"Average Sentiment: {results['airline_avg_sentiment']}")
    print(f"Other Airlines Observations: {results['other_airlines_observations']}")
    print(f"Other Airlines Average Sentiment: {results['other_airlines_avg_sentiment']}")
    print(f"T-Statistic: {results['t_stat']}")
    print(f"P-Value: {results['p_value']}")
    print(f"One-Tail P-Value: {results['one_tail_p_value']}")
    print("\n")  # Blank lines between airlines

Results for Avianca:
Observations: 3
Average Sentiment: 1.3333333333333333
Other Airlines Observations: 1216
Other Airlines Average Sentiment: 1.96875
T-Statistic: -1.8997756148196903
P-Value: 0.19613377449046387
One-Tail P-Value: 0.09806688724523194


Results for Spirit Airlines:
Observations: 86
Average Sentiment: 1.5232558139534884
Other Airlines Observations: 1133
Other Airlines Average Sentiment: 2.000882612533098
T-Statistic: -7.769401472484296
P-Value: 1.522050217756363e-12
One-Tail P-Value: 7.610251088781815e-13


Results for US Airways:
Observations: 46
Average Sentiment: 1.7173913043478262
Other Airlines Observations: 1173
Other Airlines Average Sentiment: 1.9769820971867007
T-Statistic: -3.561372831828068
P-Value: 0.000712174561291259
One-Tail P-Value: 0.0003560872806456295




In [None]:
#Inflight Entertainment International

# Airlines whose international 'Inflight Entertainment' ratings are compared with
# all other international rows. Each entry is a case-insensitive substring pattern.
airlines = ['Eurowing', 'Jetstar Airways', 'Flair']

# Per-airline results, keyed by the search term above
t_test_results = {}

# Loop-invariant mask: rows that belong to international flights
is_international = data['flight_type'] == 'International'

for airline in airlines:
    # Rows whose airline name contains the search term. Missing names never
    # match (na=False), so they end up in the "other airlines" group.
    is_airline = data['Airline Name'].str.contains(airline, case=False, na=False)

    # This airline's international rows
    airline_filter = is_airline & is_international
    airline_data = data[airline_filter]
    airline_avg_sentiment = airline_data['Inflight Entertainment'].mean()
    airline_obs = len(airline_data)

    # Every other international row
    other_airlines_filter = ~is_airline & is_international
    other_airlines_data = data[other_airlines_filter]
    other_airlines_avg_sentiment = other_airlines_data['Inflight Entertainment'].mean()
    other_airlines_observations = len(other_airlines_data)

    # Welch's t-test: equal_var=False means the groups are not assumed to share
    # a variance. p_value is two-sided.
    t_stat, p_value = stats.ttest_ind(airline_data['Inflight Entertainment'],
                                      other_airlines_data['Inflight Entertainment'],
                                      equal_var=False)

    # One-tailed p-value for H1 "this airline's mean is LOWER than the others'".
    # Halving the two-sided value is only valid when the statistic lies on the
    # hypothesised (negative) side; otherwise the lower-tail area is 1 - p/2.
    if t_stat < 0:
        one_tail_p_value = p_value / 2
    else:
        one_tail_p_value = 1 - p_value / 2

    # Store results in the dictionary
    t_test_results[airline] = {
        't_stat': t_stat,
        'p_value': p_value,
        'one_tail_p_value': one_tail_p_value,
        'airline_obs': airline_obs,
        'other_airlines_observations': other_airlines_observations,
        'airline_avg_sentiment': airline_avg_sentiment,
        'other_airlines_avg_sentiment': other_airlines_avg_sentiment
    }

# Print one report per airline
for airline, results in t_test_results.items():
    print(f"Results for {airline}:")
    print(f"Observations: {results['airline_obs']}")
    print(f"Average Sentiment: {results['airline_avg_sentiment']}")
    print(f"Other Airlines Observations: {results['other_airlines_observations']}")
    print(f"Other Airlines Average Sentiment: {results['other_airlines_avg_sentiment']}")
    print(f"T-Statistic: {results['t_stat']}")
    print(f"P-Value: {results['p_value']}")
    print(f"One-Tail P-Value: {results['one_tail_p_value']}")
    print("\n")  # Blank lines between airlines

Results for Eurowing:
Observations: 3
Average Sentiment: 1.3333333333333333
Other Airlines Observations: 1366
Other Airlines Average Sentiment: 2.279648609077599
T-Statistic: -2.8253468060471016
P-Value: 0.10351427855309442
One-Tail P-Value: 0.05175713927654721


Results for Jetstar Airways:
Observations: 3
Average Sentiment: 1.3333333333333333
Other Airlines Observations: 1366
Other Airlines Average Sentiment: 2.279648609077599
T-Statistic: -2.8253468060471016
P-Value: 0.10351427855309442
One-Tail P-Value: 0.05175713927654721


Results for Flair:
Observations: 4
Average Sentiment: 1.25
Other Airlines Observations: 1365
Other Airlines Average Sentiment: 2.2805860805860805
T-Statistic: -4.087411477491211
P-Value: 0.024792115143676432
One-Tail P-Value: 0.012396057571838216




Ground Service

In [None]:
#Ground Service Domestic

# Airlines whose domestic 'Ground Service' ratings are compared with all other
# domestic rows. Each entry is a case-insensitive substring pattern.
airlines = ['Avianca', 'Frontier Airlines', 'LAN Airlines']

# Per-airline results, keyed by the search term above
t_test_results = {}

# Loop-invariant mask: rows that belong to domestic flights
is_domestic = data['flight_type'] == 'Domestic'

for airline in airlines:
    # Rows whose airline name contains the search term. Missing names never
    # match (na=False), so they end up in the "other airlines" group.
    is_airline = data['Airline Name'].str.contains(airline, case=False, na=False)

    # This airline's domestic rows
    airline_filter = is_airline & is_domestic
    airline_data = data[airline_filter]
    airline_avg_sentiment = airline_data['Ground Service'].mean()
    airline_obs = len(airline_data)

    # Every other domestic row
    other_airlines_filter = ~is_airline & is_domestic
    other_airlines_data = data[other_airlines_filter]
    other_airlines_avg_sentiment = other_airlines_data['Ground Service'].mean()
    other_airlines_observations = len(other_airlines_data)

    # Welch's t-test: equal_var=False means the groups are not assumed to share
    # a variance. p_value is two-sided.
    t_stat, p_value = stats.ttest_ind(airline_data['Ground Service'],
                                      other_airlines_data['Ground Service'],
                                      equal_var=False)

    # One-tailed p-value for H1 "this airline's mean is LOWER than the others'".
    # Halving the two-sided value is only valid when the statistic lies on the
    # hypothesised (negative) side; otherwise the lower-tail area is 1 - p/2.
    if t_stat < 0:
        one_tail_p_value = p_value / 2
    else:
        one_tail_p_value = 1 - p_value / 2

    # Store results in the dictionary
    t_test_results[airline] = {
        't_stat': t_stat,
        'p_value': p_value,
        'one_tail_p_value': one_tail_p_value,
        'airline_obs': airline_obs,
        'other_airlines_observations': other_airlines_observations,
        'airline_avg_sentiment': airline_avg_sentiment,
        'other_airlines_avg_sentiment': other_airlines_avg_sentiment
    }

# Print one report per airline
for airline, results in t_test_results.items():
    print(f"Results for {airline}:")
    print(f"Observations: {results['airline_obs']}")
    print(f"Average Sentiment: {results['airline_avg_sentiment']}")
    print(f"Other Airlines Observations: {results['other_airlines_observations']}")
    print(f"Other Airlines Average Sentiment: {results['other_airlines_avg_sentiment']}")
    print(f"T-Statistic: {results['t_stat']}")
    print(f"P-Value: {results['p_value']}")
    print(f"One-Tail P-Value: {results['one_tail_p_value']}")
    print("\n")  # Blank lines between airlines

Results for Avianca:
Observations: 3
Average Sentiment: 1.0
Other Airlines Observations: 1216
Other Airlines Average Sentiment: 1.8018092105263157
T-Statistic: -20.54984035387586
P-Value: 8.92526688816389e-81
One-Tail P-Value: 4.462633444081945e-81


Results for Frontier Airlines:
Observations: 73
Average Sentiment: 1.2328767123287672
Other Airlines Observations: 1146
Other Airlines Average Sentiment: 1.8359511343804538
T-Statistic: -7.999294047734974
P-Value: 3.809480213026414e-13
One-Tail P-Value: 1.904740106513207e-13


Results for LAN Airlines:
Observations: 3
Average Sentiment: 1.0
Other Airlines Observations: 1216
Other Airlines Average Sentiment: 1.8018092105263157
T-Statistic: -20.54984035387586
P-Value: 8.92526688816389e-81
One-Tail P-Value: 4.462633444081945e-81




In [8]:
##Ground Service International

# Airlines whose international 'Ground Service' ratings are compared with all
# other international rows. Each entry is a case-insensitive substring pattern.
airlines = ['Flair Airlines', 'Spirit Airlines', 'TAM Airlines']

# Per-airline results, keyed by the search term above
t_test_results = {}

# Loop-invariant mask: rows that belong to international flights
is_international = data['flight_type'] == 'International'

for airline in airlines:
    # Rows whose airline name contains the search term. Missing names never
    # match (na=False), so they end up in the "other airlines" group.
    is_airline = data['Airline Name'].str.contains(airline, case=False, na=False)

    # This airline's international rows
    airline_filter = is_airline & is_international
    airline_data = data[airline_filter]
    airline_avg_sentiment = airline_data['Ground Service'].mean()
    airline_obs = len(airline_data)

    # Every other international row
    other_airlines_filter = ~is_airline & is_international
    other_airlines_data = data[other_airlines_filter]
    other_airlines_avg_sentiment = other_airlines_data['Ground Service'].mean()
    other_airlines_observations = len(other_airlines_data)

    # Welch's t-test: equal_var=False means the groups are not assumed to share
    # a variance. p_value is two-sided.
    t_stat, p_value = stats.ttest_ind(airline_data['Ground Service'],
                                      other_airlines_data['Ground Service'],
                                      equal_var=False)

    # One-tailed p-value for H1 "this airline's mean is LOWER than the others'".
    # Halving the two-sided value is only valid when the statistic lies on the
    # hypothesised (negative) side; otherwise the lower-tail area is 1 - p/2.
    if t_stat < 0:
        one_tail_p_value = p_value / 2
    else:
        one_tail_p_value = 1 - p_value / 2

    # Store results in the dictionary
    t_test_results[airline] = {
        't_stat': t_stat,
        'p_value': p_value,
        'one_tail_p_value': one_tail_p_value,
        'airline_obs': airline_obs,
        'other_airlines_observations': other_airlines_observations,
        'airline_avg_sentiment': airline_avg_sentiment,
        'other_airlines_avg_sentiment': other_airlines_avg_sentiment
    }

# Print one report per airline
for airline, results in t_test_results.items():
    print(f"Results for {airline}:")
    print(f"Observations: {results['airline_obs']}")
    print(f"Average Sentiment: {results['airline_avg_sentiment']}")
    print(f"Other Airlines Observations: {results['other_airlines_observations']}")
    print(f"Other Airlines Average Sentiment: {results['other_airlines_avg_sentiment']}")
    print(f"T-Statistic: {results['t_stat']}")
    print(f"P-Value: {results['p_value']}")
    print(f"One-Tail P-Value: {results['one_tail_p_value']}")
    print("\n")  # Blank lines between airlines

Results for Flair Airlines:
Observations: 4
Average Sentiment: 1.0
Other Airlines Observations: 1365
Other Airlines Average Sentiment: 2.131868131868132
T-Statistic: -28.501768775872378
P-Value: 1.4461112372477606e-140
One-Tail P-Value: 7.230556186238803e-141


Results for Spirit Airlines:
Observations: 7
Average Sentiment: 1.1428571428571428
Other Airlines Observations: 1362
Other Airlines Average Sentiment: 2.133627019089574
T-Statistic: -6.681168337110033
P-Value: 0.0002882652925866248
One-Tail P-Value: 0.0001441326462933124


Results for TAM Airlines:
Observations: 15
Average Sentiment: 1.3333333333333333
Other Airlines Observations: 1354
Other Airlines Average Sentiment: 2.137370753323486
T-Statistic: -2.943635193492951
P-Value: 0.010287144783345244
One-Tail P-Value: 0.005143572391672622




Wifi and Connectivity

In [9]:
#Wifi and Connectivity Domestic

# Airlines whose domestic 'Wifi & Connectivity' ratings are compared with all
# other domestic rows. Each entry is a case-insensitive substring pattern.
airlines = ['Spirit Airlines', 'Allegiant Air', 'Copa Airlines']

# Per-airline results, keyed by the search term above
t_test_results = {}

# Loop-invariant mask: rows that belong to domestic flights
is_domestic = data['flight_type'] == 'Domestic'

for airline in airlines:
    # Rows whose airline name contains the search term. Missing names never
    # match (na=False), so they end up in the "other airlines" group.
    is_airline = data['Airline Name'].str.contains(airline, case=False, na=False)

    # This airline's domestic rows
    airline_filter = is_airline & is_domestic
    airline_data = data[airline_filter]
    airline_avg_sentiment = airline_data['Wifi & Connectivity'].mean()
    airline_obs = len(airline_data)

    # Every other domestic row
    other_airlines_filter = ~is_airline & is_domestic
    other_airlines_data = data[other_airlines_filter]
    other_airlines_avg_sentiment = other_airlines_data['Wifi & Connectivity'].mean()
    other_airlines_observations = len(other_airlines_data)

    # Welch's t-test: equal_var=False means the groups are not assumed to share
    # a variance. p_value is two-sided.
    t_stat, p_value = stats.ttest_ind(airline_data['Wifi & Connectivity'],
                                      other_airlines_data['Wifi & Connectivity'],
                                      equal_var=False)

    # One-tailed p-value for H1 "this airline's mean is LOWER than the others'".
    # Halving the two-sided value is only valid when the statistic lies on the
    # hypothesised (negative) side; otherwise the lower-tail area is 1 - p/2.
    if t_stat < 0:
        one_tail_p_value = p_value / 2
    else:
        one_tail_p_value = 1 - p_value / 2

    # Store results in the dictionary
    t_test_results[airline] = {
        't_stat': t_stat,
        'p_value': p_value,
        'one_tail_p_value': one_tail_p_value,
        'airline_obs': airline_obs,
        'other_airlines_observations': other_airlines_observations,
        'airline_avg_sentiment': airline_avg_sentiment,
        'other_airlines_avg_sentiment': other_airlines_avg_sentiment
    }

# Print one report per airline
for airline, results in t_test_results.items():
    print(f"Results for {airline}:")
    print(f"Observations: {results['airline_obs']}")
    print(f"Average Sentiment: {results['airline_avg_sentiment']}")
    print(f"Other Airlines Observations: {results['other_airlines_observations']}")
    print(f"Other Airlines Average Sentiment: {results['other_airlines_avg_sentiment']}")
    print(f"T-Statistic: {results['t_stat']}")
    print(f"P-Value: {results['p_value']}")
    print(f"One-Tail P-Value: {results['one_tail_p_value']}")
    print("\n")  # Blank lines between airlines

Results for Spirit Airlines:
Observations: 86
Average Sentiment: 1.4883720930232558
Other Airlines Observations: 1133
Other Airlines Average Sentiment: 1.917034421888791
T-Statistic: -7.106622086946875
P-Value: 7.095528483959912e-11
One-Tail P-Value: 3.547764241979956e-11


Results for Allegiant Air:
Observations: 86
Average Sentiment: 1.6511627906976745
Other Airlines Observations: 1133
Other Airlines Average Sentiment: 1.9046778464254193
T-Statistic: -4.360538527917628
P-Value: 2.550662352706383e-05
One-Tail P-Value: 1.2753311763531915e-05


Results for Copa Airlines:
Observations: 11
Average Sentiment: 1.5454545454545454
Other Airlines Observations: 1208
Other Airlines Average Sentiment: 1.8899006622516556
T-Statistic: -2.1599678372935363
P-Value: 0.054802642566750284
One-Tail P-Value: 0.027401321283375142




In [10]:
#Wifi and Connectivity International

# Search terms for the airlines under test; each one is compared against every
# other international row on the 'Wifi & Connectivity' rating.
airlines = ['Eurowings', 'Qantas Airways', 'Flair airlines']

# Summary statistics and test output, one entry per search term
t_test_results = {}

for airline in airlines:
    # Case-insensitive name match; rows with a missing name count as "no match"
    name_matches = data['Airline Name'].str.contains(airline, case=False, na=False)
    international = data['flight_type'] == 'International'

    # Split the international rows into "this airline" and "everyone else"
    airline_filter = name_matches & international
    other_airlines_filter = ~name_matches & international
    airline_data = data[airline_filter]
    other_airlines_data = data[other_airlines_filter]

    airline_scores = airline_data['Wifi & Connectivity']
    other_scores = other_airlines_data['Wifi & Connectivity']

    airline_avg_sentiment = airline_scores.mean()
    airline_obs = len(airline_data)
    other_airlines_avg_sentiment = other_scores.mean()
    other_airlines_observations = len(other_airlines_data)

    # Welch's t-test (variances not assumed equal); p_value is two-sided
    t_stat, p_value = stats.ttest_ind(airline_scores, other_scores, equal_var=False)

    # Lower-tail p-value: half the two-sided value when the statistic is
    # negative, otherwise its complement
    one_tail_p_value = p_value / 2 if t_stat < 0 else 1 - p_value / 2

    t_test_results[airline] = dict(
        t_stat=t_stat,
        p_value=p_value,
        one_tail_p_value=one_tail_p_value,
        airline_obs=airline_obs,
        other_airlines_observations=other_airlines_observations,
        airline_avg_sentiment=airline_avg_sentiment,
        other_airlines_avg_sentiment=other_airlines_avg_sentiment,
    )

# Report each airline's figures in insertion order
for airline, results in t_test_results.items():
    print(f"Results for {airline}:")
    print(f"Observations: {results['airline_obs']}")
    print(f"Average Sentiment: {results['airline_avg_sentiment']}")
    print(f"Other Airlines Observations: {results['other_airlines_observations']}")
    print(f"Other Airlines Average Sentiment: {results['other_airlines_avg_sentiment']}")
    print(f"T-Statistic: {results['t_stat']}")
    print(f"P-Value: {results['p_value']}")
    print(f"One-Tail P-Value: {results['one_tail_p_value']}")
    print("\n")  # Blank lines between airlines

Results for Eurowings:
Observations: 3
Average Sentiment: 1.3333333333333333
Other Airlines Observations: 1366
Other Airlines Average Sentiment: 1.917276720351391
T-Statistic: -1.7474007726542595
P-Value: 0.22141588759336905
One-Tail P-Value: 0.11070794379668453


Results for Qantas Airways:
Observations: 3
Average Sentiment: 1.3333333333333333
Other Airlines Observations: 1366
Other Airlines Average Sentiment: 1.917276720351391
T-Statistic: -1.7474007726542595
P-Value: 0.22141588759336905
One-Tail P-Value: 0.11070794379668453


Results for Flair airlines:
Observations: 4
Average Sentiment: 1.25
Other Airlines Observations: 1365
Other Airlines Average Sentiment: 1.917948717948718
T-Statistic: -2.6598125449810337
P-Value: 0.07490916375272869
One-Tail P-Value: 0.03745458187636434




Cabin Staff

In [11]:
# Cabin Staff Domestic
#
# For each airline below, compare its 'Cabin Staff Service' ratings on Domestic
# flights with the Domestic ratings of all other airlines (Welch's t-test), and
# derive the lower-tail p-value for H1: "this airline's mean is lower".
# NOTE(review): groups with only a handful of observations give unreliable
# t-tests; read those p-values with caution.

# List of airlines to test
airlines = ['Frontier Airlines', 'Silver Airways', 'LAN Airlines']

# Initialize a dictionary to store results
t_test_results = {}

# The flight-type mask is the same for every airline, so compute it once
domestic_filter = data['flight_type'] == 'Domestic'

# Loop through each airline and perform the tests
for airline in airlines:
    # Case-insensitive substring match on the airline name. regex=False treats
    # the name as literal text instead of a regex pattern; na=False sends rows
    # with a missing name to the comparison group.
    name_match = data['Airline Name'].str.contains(airline, case=False, na=False, regex=False)

    # Current airline's Domestic rows that actually carry a rating, so the
    # count, the mean and the t-test all describe the same sample
    airline_filter = name_match & domestic_filter
    airline_data = data[airline_filter].dropna(subset=['Cabin Staff Service'])
    airline_avg_sentiment = airline_data['Cabin Staff Service'].mean()
    airline_obs = len(airline_data)

    # Every other airline's Domestic rows that actually carry a rating
    other_airlines_filter = ~name_match & domestic_filter
    other_airlines_data = data[other_airlines_filter].dropna(subset=['Cabin Staff Service'])
    other_airlines_avg_sentiment = other_airlines_data['Cabin Staff Service'].mean()
    other_airlines_observations = len(other_airlines_data)

    # Perform Welch's t-test (equal_var=False: group variances are not pooled)
    t_stat, p_value = stats.ttest_ind(airline_data['Cabin Staff Service'],
                                      other_airlines_data['Cabin Staff Service'],
                                      equal_var=False)

    # Convert the two-sided p-value to the lower-tail one: when the airline's
    # mean is below the others' (t < 0) the tail is half the two-sided value,
    # otherwise it is the complement of that half.
    if t_stat < 0:
        one_tail_p_value = p_value / 2
    else:
        one_tail_p_value = 1 - p_value / 2

    # Store results in the dictionary
    t_test_results[airline] = {
        't_stat': t_stat,
        'p_value': p_value,
        'one_tail_p_value': one_tail_p_value,
        'airline_obs': airline_obs,
        'other_airlines_observations': other_airlines_observations,
        'airline_avg_sentiment': airline_avg_sentiment,
        'other_airlines_avg_sentiment': other_airlines_avg_sentiment
    }

# Print the results
for airline, results in t_test_results.items():
    print(f"Results for {airline}:")
    print(f"Observations: {results['airline_obs']}")
    print(f"Average Sentiment: {results['airline_avg_sentiment']}")
    print(f"Other Airlines Observations: {results['other_airlines_observations']}")
    print(f"Other Airlines Average Sentiment: {results['other_airlines_avg_sentiment']}")
    print(f"T-Statistic: {results['t_stat']}")
    print(f"P-Value: {results['p_value']}")
    print(f"One-Tail P-Value: {results['one_tail_p_value']}")
    print("\n")  # Adds a newline for better readability

Results for Frontier Airlines:
Observations: 73
Average Sentiment: 1.7534246575342465
Other Airlines Observations: 1146
Other Airlines Average Sentiment: 2.4650959860383943
T-Statistic: -6.00606206569406
P-Value: 3.3187707736527204e-08
One-Tail P-Value: 1.6593853868263602e-08


Results for Silver Airways:
Observations: 74
Average Sentiment: 1.837837837837838
Other Airlines Observations: 1145
Other Airlines Average Sentiment: 2.4602620087336247
T-Statistic: -4.068907306426157
P-Value: 0.00010395393086360435
One-Tail P-Value: 5.1976965431802175e-05


Results for LAN Airlines:
Observations: 3
Average Sentiment: 1.6666666666666667
Other Airlines Observations: 1216
Other Airlines Average Sentiment: 2.424342105263158
T-Statistic: -1.1342275908954162
P-Value: 0.37354127733161063
One-Tail P-Value: 0.18677063866580532




In [None]:
# Cabin Staff International
#
# For each airline below, compare its 'Cabin Staff Service' ratings on
# International flights with the International ratings of all other airlines
# (Welch's t-test), and derive the lower-tail p-value for H1: "this airline's
# mean is lower".
# NOTE(review): groups with only a handful of observations, or whose ratings
# are all identical (zero sample variance), give unreliable t-tests; read
# those p-values with caution.

# List of airlines to test
airlines = ['Eurowings', 'Flair Airlines','Frontier Airlines']

# Initialize a dictionary to store results
t_test_results = {}

# The flight-type mask is the same for every airline, so compute it once
international_filter = data['flight_type'] == 'International'

# Loop through each airline and perform the tests
for airline in airlines:
    # Case-insensitive substring match on the airline name. regex=False treats
    # the name as literal text instead of a regex pattern; na=False sends rows
    # with a missing name to the comparison group.
    name_match = data['Airline Name'].str.contains(airline, case=False, na=False, regex=False)

    # Current airline's International rows that actually carry a rating, so
    # the count, the mean and the t-test all describe the same sample
    airline_filter = name_match & international_filter
    airline_data = data[airline_filter].dropna(subset=['Cabin Staff Service'])
    airline_avg_sentiment = airline_data['Cabin Staff Service'].mean()
    airline_obs = len(airline_data)

    # Every other airline's International rows that actually carry a rating
    other_airlines_filter = ~name_match & international_filter
    other_airlines_data = data[other_airlines_filter].dropna(subset=['Cabin Staff Service'])
    other_airlines_avg_sentiment = other_airlines_data['Cabin Staff Service'].mean()
    other_airlines_observations = len(other_airlines_data)

    # Perform Welch's t-test (equal_var=False: group variances are not pooled)
    t_stat, p_value = stats.ttest_ind(airline_data['Cabin Staff Service'],
                                      other_airlines_data['Cabin Staff Service'],
                                      equal_var=False)

    # Convert the two-sided p-value to the lower-tail one: when the airline's
    # mean is below the others' (t < 0) the tail is half the two-sided value,
    # otherwise it is the complement of that half.
    if t_stat < 0:
        one_tail_p_value = p_value / 2
    else:
        one_tail_p_value = 1 - p_value / 2

    # Store results in the dictionary
    t_test_results[airline] = {
        't_stat': t_stat,
        'p_value': p_value,
        'one_tail_p_value': one_tail_p_value,
        'airline_obs': airline_obs,
        'other_airlines_observations': other_airlines_observations,
        'airline_avg_sentiment': airline_avg_sentiment,
        'other_airlines_avg_sentiment': other_airlines_avg_sentiment
    }

# Print the results
for airline, results in t_test_results.items():
    print(f"Results for {airline}:")
    print(f"Observations: {results['airline_obs']}")
    print(f"Average Sentiment: {results['airline_avg_sentiment']}")
    print(f"Other Airlines Observations: {results['other_airlines_observations']}")
    print(f"Other Airlines Average Sentiment: {results['other_airlines_avg_sentiment']}")
    print(f"T-Statistic: {results['t_stat']}")
    print(f"P-Value: {results['p_value']}")
    print(f"One-Tail P-Value: {results['one_tail_p_value']}")
    print("\n")  # Adds a newline for better readability

Results for Eurowings:
Observations: 3
Average Sentiment: 1.6666666666666667
Other Airlines Observations: 1366
Other Airlines Average Sentiment: 2.7013177159590045
T-Statistic: -1.549171170352969
P-Value: 0.2605856220315078
One-Tail P-Value: 0.1302928110157539


Results for Flair Airlines:
Observations: 4
Average Sentiment: 1.0
Other Airlines Observations: 1365
Other Airlines Average Sentiment: 2.704029304029304
T-Statistic: -42.462324914864546
P-Value: 8.981977578841396e-252
One-Tail P-Value: 4.490988789420698e-252


Results for Frontier Airlines:
Observations: 8
Average Sentiment: 1.0
Other Airlines Observations: 1361
Other Airlines Average Sentiment: 2.7090374724467305
T-Statistic: -42.54500402702393
P-Value: 3.4315451020098315e-252
One-Tail P-Value: 1.7157725510049157e-252




  res = hypotest_fun_out(*samples, **kwds)
