# Data Analysis Notebook

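This notebook is designed to run in Google Colab. It mounts your Google Drive, clones the repository into it (or pulls the latest changes if it has already been cloned), installs the dependencies, generates the field design, runs the analysis, and displays the resulting dashboard. Before running it, set `REPO_URL` in the "Clone Repository" cell to your repository's URL.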

In [None]:
# Mount Google Drive
# Attaches Google Drive to the Colab filesystem at the mount point below.
from google.colab import drive

DRIVE_MOUNT_POINT = '/content/drive'
drive.mount(DRIVE_MOUNT_POINT)

In [None]:
# Clone Repository
import os

# Replace with your actual repository URL
REPO_URL = "YOUR_REPO_URL_HERE"
REPO_NAME = REPO_URL.split("/")[-1].replace(".git", "")

if not os.path.exists(f"/content/drive/MyDrive/{REPO_NAME}"):
    %cd /content/drive/MyDrive
    !git clone {REPO_URL}
    %cd {REPO_NAME}
else:
    %cd /content/drive/MyDrive/{REPO_NAME}
    !git pull

In [None]:
# Install Dependencies
!pip install pandas numpy openpyxl plotly

# Generate Field Design

Run the next cell to generate the `plan_de_campo.xlsx` file with detailed quotas for field work.
To change the design, adjust `TARGET_SAMPLE_SIZE`, `N_STATES`, and `MUNIS_PER_STATE` at the top of that cell before running it.

In [None]:
# Configuration Parameters for Field Design
# These three values are passed unchanged to create_field_design.main() below.
TARGET_SAMPLE_SIZE = 3000
N_STATES = 10
MUNIS_PER_STATE = 2

# Generate Field Design Plan
import os
import sys

# create_field_design.py is imported from the current working directory, so make
# sure that directory is importable without relying on a later cell having
# extended sys.path. Guarded so re-running the cell does not add duplicates.
if os.getcwd() not in sys.path:
    sys.path.append(os.getcwd())

try:
    from create_field_design import main as create_design
except ModuleNotFoundError as exc:
    # Only report "not found" when the missing module is create_field_design
    # itself; a missing dependency imported *by* that module is a different
    # problem and is re-raised with its real traceback.
    if exc.name != "create_field_design":
        raise
    print("create_field_design.py not found. Make sure you have pulled the latest changes.")
else:
    # Runs outside the try block so errors raised while building the design are
    # not mistaken for a missing file.
    create_design(target_n=TARGET_SAMPLE_SIZE, n_states=N_STATES, munis_per_state=MUNIS_PER_STATE)
    print("Design file created: plan_de_campo.xlsx")


In [None]:
# Run Analysis
import sys
import os

# process_sample.py is imported from the current working directory, so that
# directory must be on the import path. The membership check keeps the cell
# idempotent: re-running it does not append the same entry again.
_cwd = os.getcwd()
if _cwd not in sys.path:
    sys.path.append(_cwd)

from process_sample import main

# Invoke the analysis entry point when this code runs as the top-level module.
if __name__ == "__main__":
    main()

In [None]:
# View Dashboard
# Loads dashboard.html (resolved relative to the current working directory) and
# renders it as the cell's output.
import IPython.display

dashboard = IPython.display.HTML(filename='dashboard.html')
dashboard