<a href="https://colab.research.google.com/github/tsenga2/boj-meeting-analysis/blob/main/main.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [None]:
# 1. Mount Google Drive
# Mounts Drive at /content/drive so that paths under /content/drive/MyDrive
# are reachable from the notebook. Requires the Colab runtime
# (google.colab is only importable there).
from google.colab import drive
drive.mount('/content/drive')

In [None]:
# 2. Clone the repository
!git clone https://github.com/tsenga2/boj-meeting-analysis.git
%cd boj-meeting-analysis

In [None]:
# 3. Install required packages
!apt-get update
!apt-get install -y tesseract-ocr tesseract-ocr-jpn poppler-utils mecab libmecab-dev mecab-ipadic-utf8
!pip install pdf2image pytesseract mecab-python3 yfinance pandas-datareader scikit-learn numpy pandas matplotlib seaborn requests beautifulsoup4 lxml tqdm

In [None]:
# 4. Prepare the analysis: import the pipeline functions from main.py and
#    define the Google Drive directories
import os
import sys

# Put the current working directory on the import path so `main` resolves
sys.path.append('.')
from main import (
    get_boj_meeting_dates,
    download_boj_press_conferences,
    download_boj_pdfs,
    extract_boj_minutes_text,
    analyze_meeting_texts,
    fetch_market_data,
    calculate_inter_meeting_stats,
    combine_text_and_market_analysis,
    analyze_similarity_market_relationship,
)

# Directory layout on Google Drive
# NOTE(review): in the cells visible here, PDF_DIR and OUTPUT_DIR are only
# referenced by a commented-out call — confirm the pipeline functions
# actually read from / write to these locations.
BASE_DIR = '/content/drive/MyDrive/BOJ_Analysis'
PDF_DIR = os.path.join(BASE_DIR, 'pdfs')
OUTPUT_DIR = os.path.join(BASE_DIR, 'output')

# Make sure each directory exists; already-existing ones are left untouched
for directory in (BASE_DIR, PDF_DIR, OUTPUT_DIR):
    os.makedirs(directory, exist_ok=True)



In [None]:
# Run analysis steps
# Step 1: obtain the meeting dates via main.get_boj_meeting_dates().
# `meeting_dates` is consumed later by calculate_inter_meeting_stats.
print("Step 1: Get BOJ meeting dates")
meeting_dates = get_boj_meeting_dates()



In [None]:
# Step 2: download the source documents with the two helpers from main.py.
print("Step 2: Download BOJ meeting PDFs")
# range(2006, 2010) yields the years 2006 through 2009.
download_boj_pdfs(range(2006,2010))  # Adjust year range as needed
# NOTE(review): presumably (start_year, end_year); whether 2024 is inclusive
# depends on main.py — confirm before changing the range.
download_boj_press_conferences(2010, 2024)



In [None]:
# Step 3: build `text_df`, which is passed to combine_text_and_market_analysis
# in a later cell.
print("Step 3: Analyze meeting texts")
# Disabled alternative: analyze_meeting_texts with an explicit PDF directory
# and page limit. The active call below uses extract_boj_minutes_text instead.
#text_df = analyze_meeting_texts(pdf_dir=PDF_DIR, max_pages=1)
text_df = extract_boj_minutes_text()

In [None]:
# Step 4: fetch market data via main.fetch_market_data() (called with its
# defaults). `market_data` feeds calculate_inter_meeting_stats in the next step.
print("Step 4: Fetch market data")
market_data = fetch_market_data()



In [None]:
# Step 5: compute market statistics from the fetched market data and the
# meeting dates. Requires `market_data` and `meeting_dates` from earlier cells.
print("Step 5: Calculate market statistics")
market_stats = calculate_inter_meeting_stats(market_data, meeting_dates)



In [None]:
# Step 6: combine the text results with the market statistics.
# Requires `text_df` and `market_stats` from earlier cells.
print("Step 6: Combine analyses")
combined_df = combine_text_and_market_analysis(text_df, market_stats)



In [None]:
# Step 7: analyze the relationship on the combined data. The helper returns
# two values, unpacked here as `correlation_df` and `group_stats`.
print("Step 7: Analyze relationship")
correlation_df, group_stats = analyze_similarity_market_relationship(combined_df)

# Final status message once every step has run.
print("Analysis complete!")