## Observations and Insights 

In [27]:
%matplotlib widget

In [28]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import scipy.stats as st

# Study data files
mouse_metadata_path = "data/Mouse_metadata.csv"
study_results_path = "data/Study_results.csv"

# Read the mouse data and the study results
mouse_metadata = pd.read_csv(mouse_metadata_path)
study_results = pd.read_csv(study_results_path)

# Combine the data into a single dataset and display the data table for preview
combined_mousestudy_df = pd.merge(mouse_metadata, study_results,
                                 how='left', on='Mouse ID')

# sorting by mouse id and remove values that are duplicated
combined_mousestudy_df.sort_values(["Mouse ID", "Timepoint"], inplace = True) 

combined_mousestudy_df.loc[combined_mousestudy_df.duplicated(subset = ["Mouse ID", "Timepoint"]), "Mouse ID"]

combined_mousestudy_df = combined_mousestudy_df.loc[combined_mousestudy_df["Mouse ID"] != "g989", :]
 
#Display data
combined_mousestudy_df["Tumor Volume (mm3)"] = combined_mousestudy_df["Tumor Volume (mm3)"].map('{:,.2f}'.format)

combined_mousestudy_df.head()


Unnamed: 0,Mouse ID,Drug Regimen,Sex,Age_months,Weight (g),Timepoint,Tumor Volume (mm3),Metastatic Sites
454,a203,Infubinol,Female,20,23,0,45.0,0
455,a203,Infubinol,Female,20,23,5,48.51,0
456,a203,Infubinol,Female,20,23,10,51.85,1
457,a203,Infubinol,Female,20,23,15,52.78,1
458,a203,Infubinol,Female,20,23,20,55.17,1


In [29]:
combined_mousestudy_df["Drug Regimen"].unique()

array(['Infubinol', 'Placebo', 'Ceftamin', 'Stelasyn', 'Zoniferol',
       'Ramicane', 'Ketapril', 'Propriva', 'Naftisol', 'Capomulin'],
      dtype=object)

## Summary Statistics

In [35]:
#Create drug regimen data frame
Drugs = combined_mousestudy_df[["Drug Regimen", "Tumor Volume (mm3)"]]

# Summary statistics table 
# mean, median, variance, standard deviation, and SEM (standard error of the mean) of the tumor volume for each regimen

In [20]:
# Summary statistics table 
# mean, median, variance, standard deviation, and SEM (standard error of the mean) of the tumor volume for each regimen

tumor_volume_avg = combined_mousestudy_df["Tumor Volume (mm3)"].mean()
tumor_volume_median = combined_mousestudy_df["Tumor Volume (mm3)"].median()
tumor_volume_variance = combined_mousestudy_df["Tumor Volume (mm3)"].var()
tumor_volume_standev = combined_mousestudy_df["Tumor Volume (mm3)"].std()
tumor_volume_sem = combined_mousestudy_df["Tumor Volume (mm3)"].sem()

Summary_tumor_volume = pd.DataFrame({'Avg Tumor Volume': [tumor_volume_avg], 'Mediam Tumor Volume': [tumor_volume_median], 
                                     'Variance': [tumor_volume_variance], 'Standard Deviation': [tumor_volume_standev], 
                                     'Standard Error of Mean': [tumor_volume_sem]})
Summary_tumor_volume

TypeError: Could not convert 45.0048.5151.8552.7855.1756.7959.5261.9363.5967.9745.0046.9848.5950.5354.4657.4159.8660.9063.1065.5345.0048.7249.6053.8357.0160.1364.9666.5669.5970.7245.0046.8047.3749.7350.5153.5854.4456.3560.9263.0045.0048.9553.5255.2757.2959.0163.4445.0046.1147.7349.9352.2054.2155.9160.3561.7766.7945.0045.4740.7641.4838.0938.7039.1339.7240.2638.4145.0044.0144.5143.0041.7142.2942.7941.7442.5043.0545.0047.4649.7845.0046.4148.4351.9953.6854.7056.2057.3157.9360.1245.0038.7236.4335.5935.9536.5636.9537.6238.2638.8145.0046.2049.5150.9252.3754.3857.0345.0045.5546.3846.9145.8741.4837.2135.1335.7832.9845.0046.8747.6648.9549.4951.9455.4558.0960.5766.0845.0046.5547.8749.5350.7151.8554.3856.5158.6162.1945.0047.0150.1652.5454.0656.7760.4145.0045.7049.7951.2354.8356.9760.0763.3069.2775.0045.0045.6947.9752.3454.6056.4159.9264.0567.2172.2645.0046.2347.1547.8451.4652.1353.4056.8158.4662.7745.0045.6543.2743.7842.7343.2640.6137.9738.3838.9845.0047.1548.3249.1953.9855.7545.0045.0046.2147.6651.6853.4356.0645.0047.4148.0451.3855.6557.0461.1965.7169.9773.0545.0041.5342.0039.5237.9538.6239.1739.8538.2638.9445.0048.0149.1351.5954.4455.0855.7445.0049.1650.3451.6253.9856.4760.9164.2667.1972.5645.0048.7549.9951.8356.7461.4664.1567.8269.4372.2345.0045.7949.0353.6654.5756.9757.8261.0765.7167.9445.0045.7348.1849.2751.9556.2959.0159.8965.0265.8245.0047.6948.5352.7254.0855.0857.4262.2463.2864.5845.0036.3245.0049.3450.5752.2354.8858.2763.7465.8170.2274.0445.0045.7244.4545.1139.5137.7538.3445.0046.5647.2951.4152.6054.5657.1559.4660.8661.8445.0046.6347.5751.9955.5856.2958.0545.0047.7849.2251.5352.8257.1160.1064.2966.6069.0445.0045.5846.2946.9443.1343.6044.1237.8032.8333.4045.0047.3149.5050.6053.0158.2160.2665.9567.6969.8245.0045.7746.6648.3749.7651.8356.1057.7362.1845.0048.6949.8152.8656.7158.8960.5061.1262.5765.4245.0045.4849.7852.9553.6857.5360.9745.0046.3550.9753.2755.4856.5560.7561.8764.1845.0045.0046.6247.4745.0041.7542.4339.4737.6538.1038.7237.7138.2737.3145.0045.9246.9747.7851.7354.2855.3456.4860.2345.0045.7047.3951.7952.6155.2256.4658.2560.2463.1145.0047.2451.3552.8356.6160.6062.4666.9570.7273.2145.0046.1448.5349.3552.5355.1445.0047.1149.4354.0555.2557.4157.9960.0661.5362.4445.0045.6647.2548.4350.3451.3954.9858.0962.8268.3645.0045.8246.4143.5544.0044.6645.3543.2244.0140.6645.0047.0048.1849.9945.0047.3147.9048.7451.1152.1856.8757.7545.0048.1945.0045.5947.2248.3549.6153.0854.3656.5258.3260.9245.0047.0345.0046.3748.1548.7245.0046.5751.0753.9558.8460.2565.8966.7471.1173.3245.0045.0038.8035.6232.6230.4945.0046.4048.1949.1152.0845.0048.7953.4458.1462.7164.6669.1671.9145.0045.8446.3042.1742.9642.3742.8738.9536.3637.0745.0046.5948.2749.6551.4555.6758.0060.3862.2268.1645.0044.0244.5045.2245.9346.8144.2244.7045.5740.1645.0048.7849.6553.6555.1057.5261.1164.0967.7469.8745.0046.1950.0951.0155.0955.7558.9560.8661.7745.0047.6649.1952.6854.6456.8560.3362.3368.5370.4945.0045.8540.1740.6841.2135.5734.9530.9631.3729.1345.0046.8848.1851.0645.0049.4751.3756.1857.9459.5563.6067.2171.1574.1045.0045.7546.2350.6952.0053.7355.4645.0045.0047.7845.0044.0741.0240.3335.3534.0834.7135.1535.5633.5645.0041.0241.6339.1639.6938.2539.0139.7740.4436.3745.0046.8549.8651.7455.0956.6959.1364.9367.2945.0046.6647.5245.0042.2642.9943.5343.9744.6045.2645.9446.8247.6945.0047.2448.6949.5451.8852.9353.6055.6856.8458.6345.0046.7648.2848.8650.8753.3045.0045.6043.4237.9838.5334.9735.5836.1836.8437.3145.0046.4950.4251.4255.9756.5860.5962.1364.3065.3445.0045.8446.4347.3248.1642.4243.0143.7744.5938.1345.0046.5948.0251.1652.9445.0045.6446.4143.3144.0244.5638.0438.7545.0046.8048.5350.7054.0155.7756.8058.7160.0761.8545.0046.7148.3549.5950.9451.8154.4056.9662.3364.2945.0047.2448.1751.4555.5058.0660.0162.7367.2169.5645.0044.0144.5045.2542.1737.8634.7635.1731.0031.5645.0048.4150.1451.1754.3757.0661.2464.0667.7870.6545.0045.6246.3441.1341.6439.9334.6735.1235.5036.1345.0047.9249.3851.0752.0054.6159.9963.3366.6268.9245.0046.2750.1854.4357.8259.5063.4766.0867.4273.7245.0038.8335.0134.2233.0033.4631.1026.5524.3722.0545.0046.6150.3053.2454.7857.4359.7560.5464.1466.2045.0046.6147.6649.6952.1145.0046.0446.6148.7850.1845.0045.7349.7551.3252.6945.0048.2749.4750.4854.4855.6759.2462.1245.0049.2050.5254.4757.0658.7260.6166.5867.5769.3045.0047.6549.2749.9950.9852.3354.4055.3658.6560.7545.0049.4853.6545.0046.6750.6645.0046.2548.1849.4152.2352.8558.0961.4163.8467.7545.0045.6147.2650.5251.9155.8157.9245.0045.8546.7647.4948.0744.0144.7140.2140.7741.4845.0045.8146.7845.0046.2749.6850.9552.6253.1855.3356.4759.2159.8545.0045.9247.0149.0450.7354.2356.6561.4662.9963.9545.0048.7450.8254.2459.6265.0166.6069.1373.6976.6745.0046.1748.3549.2953.2454.9556.3257.6059.4464.3045.0045.0045.4646.1544.0644.8145.3539.3537.6838.3438.8545.0046.6247.5048.6752.6454.0845.0049.0150.8655.9161.1564.8967.7168.6970.2175.1245.0045.5247.6552.1145.0043.0043.7539.9036.7137.4437.9738.6335.1130.5645.0049.0550.5551.1753.7657.6260.8662.5468.2169.2545.0041.4136.8335.4634.2633.1231.7630.8331.3828.4345.0048.5650.9753.1556.7862.2564.9069.2770.8073.9045.0047.0145.0045.6246.4139.8038.9137.7038.2132.5632.9533.3345.0046.4347.2048.4849.2553.9755.0457.1259.8363.5945.0045.5240.3836.9437.4833.2133.8234.4934.9531.1045.0045.0046.1045.0047.3551.0454.2254.8256.1760.1745.0047.5549.1545.0046.0946.8247.8049.2653.4155.4157.3858.0145.0045.8248.7951.7452.6056.8659.6360.3666.2345.0046.0847.4749.8345.0045.5947.3648.6850.8652.0754.5055.1257.2059.7445.0048.9449.7051.3856.1860.5262.0345.0047.0650.1354.7958.9761.1066.3370.1371.4578.5745.0045.5447.0845.0046.5147.1551.5153.6254.7459.6565.3671.1772.4645.0046.8948.2050.0245.0046.7651.1255.8960.6165.7468.2269.0970.2773.0645.0046.8848.6749.6850.3452.3254.8355.6345.0045.7045.0045.0046.7647.5748.2551.8354.7656.9258.5959.9062.3345.0046.7248.2549.8751.9653.1857.7760.2464.4945.0049.2750.9151.9954.9156.2857.0557.6361.3863.4945.0049.0551.5853.6856.5362.1167.1067.8774.1175.2945.0046.5648.6749.7754.2155.3445.0048.6753.3655.2556.5958.1063.2766.4969.0445.0046.8350.5252.2052.9154.5156.4157.5459.3161.4345.0047.0047.5549.6650.3652.5456.3459.1345.0047.8651.2445.0046.7247.9549.1651.9152.7854.6645.0046.7847.8448.4750.2452.4354.9559.2564.1945.0045.8350.3152.1352.6757.2659.3660.8463.1968.6145.0045.9647.0148.3251.1951.9752.6553.7145.0045.7742.5441.4041.9342.5843.3443.8144.4745.2245.0045.6344.9945.8946.5940.1540.6736.5645.0047.1849.0050.5853.2955.6858.0663.1368.5070.8345.0047.1248.5949.2250.2352.7155.0460.3362.0366.1045.0048.5149.1953.0955.2657.7158.4145.0045.6046.0646.5445.0045.7839.0135.4636.0233.8932.6833.0731.8032.3845.0047.0748.7951.0751.9052.9454.6959.2260.1962.6745.0046.8949.6552.4854.1157.9060.3464.7366.6469.7845.0045.6339.4540.0240.7737.6138.2436.0036.5237.2345.0046.8648.5250.2245.0045.5742.7143.5344.1442.6643.4245.0045.7446.5447.3743.2341.0941.6840.4041.0441.5845.0045.6449.0550.8252.0155.6545.0045.8347.2449.2351.6253.8055.8445.0047.4652.1857.2262.3564.1245.0047.1949.0045.0043.8837.6138.1836.8733.9532.9628.3325.4723.3445.0047.5848.1552.0853.7456.4960.0145.0046.8547.8948.5749.2050.9752.7554.8156.9962.1145.0038.7134.8535.2835.9336.3435.4735.8532.8030.2845.0048.2452.7854.3357.0558.5563.6764.7867.2272.5945.0046.6045.0043.1843.6941.8542.6343.0643.5744.1640.1740.7345.0047.4649.0049.7851.4956.1856.9257.7459.1364.9145.0048.0548.9649.6551.0655.5359.2863.7667.6568.7145.0045.9046.7544.4439.0737.3432.8733.5233.9534.4645.0045.0045.9246.3948.0952.6455.8857.7060.4661.5363.4245.0046.3650.7055.5857.2359.8364.2367.7469.7375.1145.0047.8952.6153.4656.5345.0045.7947.4048.5250.3852.9345.0045.0045.5646.4247.2346.1146.7147.6247.0043.4540.6745.0045.6949.2450.6653.1956.0657.3158.0960.4766.2745.0045.7646.5747.2140.3435.5035.9835.4636.0231.0245.0045.9946.7347.6749.1145.0045.0046.2048.1352.6054.2556.7245.0046.1147.5450.6755.7357.6959.3361.8965.4745.0046.2545.0046.2250.6545.0046.0247.8352.1053.7256.0857.9963.1945.0047.1951.5052.6154.0545.0047.0548.1949.4145.0048.1550.3651.5445.0047.1648.9750.5551.3045.0045.7039.8540.4639.6540.1640.7541.4442.1540.6645.0048.8652.6145.0049.2152.6454.5957.7460.0262.7463.9064.8570.1745.0047.7245.0039.2039.9545.0045.5546.5047.2449.5551.8756.7758.3462.1967.5345.0048.7951.8353.9057.5561.8767.2068.1345.0045.4948.3549.3950.0145.0048.2348.9050.8552.1352.8155.8856.6862.3264.9645.0048.4649.9452.2553.6856.9660.1061.4163.0767.9945.0045.8947.4648.2550.6752.6045.0048.9150.1450.8755.5958.5960.1563.6964.9468.4045.0046.0547.3051.2753.3255.6558.2745.0043.1745.0048.3048.9352.6654.2357.6160.7263.6945.0049.4545.0045.8943.2343.6941.1140.2940.9941.6635.6136.0445.0046.9449.1245.0046.7548.9345.0045.0047.0447.8950.0053.0756.8958.1661.3063.2845.0045.0045.4739.1139.7836.0736.6232.9230.2128.1728.4845.0046.3346.8949.1250.4152.4354.3555.2456.6961.6245.0047.2049.0749.7551.2151.9455.4958.0860.2864.6345.0046.1046.8248.0845.0045.8547.1947.6749.7451.1052.8155.1955.9958.6345.0045.6748.9849.6951.9154.0455.4556.8059.5661.3945.0046.0850.2651.9752.5653.7345.0048.2849.1151.5254.5756.1859.4161.7363.6267.6945.0046.8048.0850.2050.7354.4458.5859.6060.9162.9145.0045.8846.3844.1845.0048.6452.2953.6156.8557.8359.3761.8965.9766.8445.0048.4845.0046.4248.0252.7655.0358.3461.0763.4364.2568.5945.0041.0241.6342.2840.7238.9935.7336.3331.4831.9045.0046.7449.5250.8152.3657.1759.0361.1563.4764.7345.0046.1345.0045.9345.0047.1248.7145.0042.1942.9538.6936.8937.4137.8238.5034.0230.6445.0049.2750.4851.2051.8154.3256.2958.6360.0562.7545.0046.8348.0349.3753.2857.9559.7960.4462.3865.7445.0049.3352.6654.7157.9063.1565.8469.1870.3173.87 to numeric

## Bar and Pie Charts

In [None]:
# Generate a bar plot showing the total number of mice for each treatment throughout the course of the study using pandas. 



In [None]:
# Generate a bar plot showing the total number of mice for each treatment throughout the course of the study using pyplot.



In [None]:
# Generate a pie plot showing the distribution of female versus male mice using pandas



In [None]:
# Generate a pie plot showing the distribution of female versus male mice using pyplot



## Quartiles, Outliers and Boxplots

In [None]:
# Calculate the final tumor volume of each mouse across four of the treatment regimens:  
# Capomulin, Ramicane, Infubinol, and Ceftamin

# Start by getting the last (greatest) timepoint for each mouse


# Merge this group df with the original dataframe to get the tumor volume at the last timepoint


In [None]:
# Put treatments into a list for for loop (and later for plot labels)


# Create empty list to fill with tumor vol data (for plotting)


# Calculate the IQR and quantitatively determine if there are any potential outliers. 

    
    # Locate the rows which contain mice on each drug and get the tumor volumes
    
    
    # add subset 
    
    
    # Determine outliers using upper and lower bounds
    

In [None]:
# Generate a box plot of the final tumor volume of each mouse across four regimens of interest


## Line and Scatter Plots

In [None]:
# Generate a line plot of time point versus tumor volume for a mouse treated with Capomulin


In [None]:
# Generate a scatter plot of mouse weight versus average tumor volume for the Capomulin regimen


## Correlation and Regression

In [None]:
# Calculate the correlation coefficient and linear regression model 
# for mouse weight and average tumor volume for the Capomulin regimen
