In [1]:
from IPython.display import display, HTML
from datetime import datetime

# Title rendered in the header below; `Notebook_title` is also reused at the
# end of the notebook to name the requirements file.
Notebook_title = "scRNA Lethal Covid19 Analysis"

# Date of this run, formatted as month name, day, year (e.g. "November 05, 2024")
current_date = format(datetime.now(), "%B %d, %Y")

# Assemble the header markup line by line: centred title, a spacer, then the
# author handle and the run date, both left-aligned.
html_content = "\n".join(
    [
        "",  # leading newline
        f'<h1 style="text-align:center;">{Notebook_title}</h1>',
        "<br/>",
        '<h3 style="text-align:left;">MikiasHWT</h3>',
        f'<h3 style="text-align:left;">{current_date}</h3>',
        "",  # trailing newline
    ]
)

# Render the header as rich HTML in the cell output
display(HTML(html_content))


# Background
As of November 2024, the [World Health Organization](https://data.who.int/dashboards/covid19/cases) reported 777 million confirmed cases (103 million in the US) of infection with severe acute respiratory syndrome coronavirus 2 (SARS-CoV-2) worldwide, with over 7 million deaths (1.2 million in the US). The resulting disease, COVID-19, has had a profound impact on global health, economies, and societies. In this project, I aim to replicate the analyses from the paper ["A molecular single-cell lung atlas of lethal COVID-19"](https://www.nature.com/articles/s41586-021-03569-1#data-availability).

The original paper provides an in-depth examination of the cellular and molecular alterations in the lungs of individuals who died of COVID-19, utilizing single-nucleus RNA sequencing to analyze lung tissue from 19 patients (12M, 7F, median age 72) who died of COVID-19 and biopsy or resection samples from 7 pre-pandemic controls (4M, 3F, median age 70).

## Objectives
By replicating the various analyses performed by the original authors, I intend to recapitulate the original findings and further explore the pathophysiology of lethal COVID-19. 

This will include:
- Process single-cell RNA sequencing data using sensible quality control metrics.
- Cluster and integrate immune cell populations between healthy and COVID-19 samples. 
- Identify and label immune cells using gene expression profiles and activation states.
- Characterize differences in cell infiltration, proportions and activation states between healthy and COVID-19 samples.

The ultimate goal of this project is to enhance my understanding of the cellular and molecular mechanisms underlying severe COVID-19.

# Prep Workplace

## Import Libraries

In [5]:
import os
import subprocess
import sys

import numpy as np
import pandas as pd

## Directories

In [None]:
# Define directories (resolved against the current working directory)
datDir = os.path.abspath("data")
outDir = os.path.abspath("output")

# List their contents.
for path in [datDir, outDir]:
    # Create the directory first if it is missing: os.listdir raises
    # FileNotFoundError on a non-existent path, which would stop the notebook
    # on a fresh checkout. exist_ok=True leaves existing folders untouched.
    os.makedirs(path, exist_ok=True)
    print(f"Contents of {path}:")
    # Sort because os.listdir returns entries in arbitrary order; an empty
    # listing joins to "" (falsy), so the placeholder text is printed instead.
    print("\n".join(sorted(os.listdir(path))) or "Directory is empty", "\n")

Contents of c:\Users\Owner\Documents\GitHub\scRNA_Lethal_Covid19_Analysis\data:
GSE171524_RAW.tar 

Contents of c:\Users\Owner\Documents\GitHub\scRNA_Lethal_Covid19_Analysis\output:
Directory is empty 



# Background

## Motivation

## Data Source

# Import Data

# Wrangle Data

explain

# Explore Data

explain

# Analyze Data

explain

# Conclusions

## Discoveries

explain

## Future Directions

explain

# End

## Show Session Information

In [8]:
# Imported in this cell, next to the call below, rather than in the
# "Import Libraries" cell near the top of the notebook.
import session_info
# Show the session information for this run (see the section heading above).
session_info.show()

## Save Session Requirements

In [9]:
# Replace spaces in notebook title with underscores
filename = Notebook_title.replace(" ", "_") + "_requirements.txt"

# Write the output of `pip freeze` to the requirements file. pip is invoked as
# `sys.executable -m pip` so the listing comes from the interpreter running
# this kernel; a bare `!pip` is resolved through PATH and can belong to a
# different environment. check=True raises CalledProcessError if pip fails
# instead of silently leaving an empty or partial file.
with open(filename, "w") as requirements_file:
    subprocess.run(
        [sys.executable, "-m", "pip", "freeze"],
        stdout=requirements_file,
        check=True,
    )