# In [1]:
from pptx import Presentation
from pptx.util import Inches

# Build the deck in memory; Presentation() with no argument starts from
# python-pptx's built-in default template.
prs = Presentation()

# Title Slide: uses layout 0 and fills its title shape plus placeholder 1
# (used here for the three-line subtitle: approach, author, date).
title_slide = prs.slides.add_slide(prs.slide_layouts[0])
title_slide.shapes.title.text = "2015 U.S. Flight Delay Prediction"
title_slide.placeholders[1].text = (
    "Using LightGBM, Random Forest, and Neural Networks\n"
    "Azadeh Ansari\n"
    "August 1, 2024"
)

# Text-only slides (Introduction, Data Description, Methodology,
# Evaluation Metrics). All of them use layout 1: the heading goes into the
# title shape and the body text into placeholder 1.
# `slide_layout` stays bound to layout 1 because later sections reuse it.
slide_layout = prs.slide_layouts[1]

text_slides = (
    (
        "Introduction",
        "Overview of the Flight Delay data\nImportance of predicting delay amount",
    ),
    (
        "Data Description",
        "Description of the dataset\nFeatures: Day of the week, Month, Scheduled Arrival Time, Scheduled Departure Time, Taxi In, Taxi Out, Airline, etc.",
    ),
    (
        "Methodology",
        "Data Preprocessing: Cleaning, Feature Engineering, Normalization\nModels Used: LightGBM, Random Forest, Neural Networks",
    ),
    (
        "Evaluation Metrics",
        "RMSE\nComputational Time",
    ),
)

# Slides are appended in the order listed above.
for heading, body in text_slides:
    slide = prs.slides.add_slide(slide_layout)
    slide.shapes.title.text = heading
    slide.placeholders[1].text = body

# EDA Slides
# One slide per entry: the caption goes into the body placeholder and the
# listed figure(s) are placed below it. Every slide carries the same title.
# Figure paths are relative to the working directory the script is run from.
eda_title = "Exploratory Data Analysis"
eda_slides = [
    (
        "Average Total Delay per Airline",
        ["../figures/average_total_delay_by_airline.png"],
    ),
    (
        # Caption matches the figure shown (departure delay by origin airport).
        "Average Departure Delay per Origin Airport",
        ["../figures/average_departure_delay_by_origin_airport.png"],
    ),
    (
        "Total Delay per Day of the Week",
        ["../figures/delay_by_day_of_week.png"],
    ),
    (
        "Departure/Arrival Delay Distribution",
        [
            "../figures/departure_delay_dist.png",
            "../figures/arrival_delay_distribution.png",
        ],
    ),
    (
        "Total Delay Distribution",
        ["../figures/total_delay_distribution.png"],
    ),
]

picture_top = Inches(2.5)
picture_width = Inches(4.5)
single_left = Inches(1)

# Two pictures side by side: anchor them to the left and right slide edges,
# deriving the right-hand offset from the actual slide width. A fixed 6in
# offset plus the 4.5in picture width ends at 10.5in, which runs past the
# right edge of python-pptx's default 10in-wide slide.
pair_margin = Inches(0.25)
pair_lefts = [pair_margin, prs.slide_width - pair_margin - picture_width]

for caption, figure_paths in eda_slides:
    slide = prs.slides.add_slide(slide_layout)
    slide.shapes.title.text = eda_title
    slide.placeholders[1].text = caption

    lefts = [single_left] if len(figure_paths) == 1 else pair_lefts
    for left, figure_path in zip(lefts, figure_paths):
        slide.shapes.add_picture(
            figure_path, left, picture_top, width=picture_width
        )

# Closing slides: model comparison followed by the conclusion. Both reuse the
# layout already held in `slide_layout`; keys are slide titles, values are the
# body text (dict order is insertion order, so slides are added as listed).
closing_slides = {
    "Comparison of Models": "RMSE on Test Data Set",
    "Conclusion": "Summary of findings\nBest performing model\nLightGBM outperforms other models.",
}

for heading, body in closing_slides.items():
    slide = prs.slides.add_slide(slide_layout)
    slide.shapes.title.text = heading
    slide.placeholders[1].text = body

# Write the finished deck; the path is relative to the current working directory.
output_path = 'Flight_Delay_Prediction.pptx'
prs.save(output_path)
