In [None]:
from pathlib import Path
import os
import sys

# Detect whether the notebook runs on Google Colab and set the project root (ROOT).
# Only the import itself is guarded: an ImportError there means "not on Colab".
# Failures while mounting Drive or changing directory are real errors and must
# surface instead of silently falling back to the local root.
try:
    from google.colab import drive
except ImportError:
    # Not on Colab: project files are resolved relative to the current directory.
    ROOT = Path(".")
else:
    drive.mount("/content/drive", force_remount=True)
    ROOT = Path("/content/drive/MyDrive/textbook-topic-analysis")
    os.chdir(ROOT)  # Relative paths in later cells resolve against the project folder
    # Make the project's packages importable; the membership check keeps
    # re-running this cell from adding duplicate sys.path entries.
    if str(ROOT) not in sys.path:
        sys.path.append(str(ROOT))

In [None]:
%%capture
! pip install -r {str(ROOT / "requirements.txt")}

In [None]:
from textbooks.data import Textbook
from pathlib import Path

# Folder with the parsed textbook JSON files, relative to the working directory.
parsed_textbooks_dir = Path("textbooks-parsed")

# Textbook that the other textbooks are passed alongside in the tuning cell below.
base_textbook = Textbook.from_json(
    parsed_textbooks_dir / "2012_Book_ModernMathematicalStatisticsWi.json"
)

# Remaining textbooks; add further file names to the tuple to include more books.
other_textbooks = [
    Textbook.from_json(parsed_textbooks_dir / json_name)
    for json_name in ("Walpole_Probability_and_Statistics.json",)
]

# Top2Vec

In [None]:
import numpy as np

from computations.top2vec import top2vec_integration
from evaluation.grid_search import tune_parameters
from textbooks.utils import extract_concept_definition, extract_content

# Text-extraction variants to try, keyed by the label used in the configuration.
top2vec_text_extractors = {
    "content": extract_content,
    "concept definitions": extract_concept_definition,
}

# Candidate values for the "similarity_threshold" setting.
top2vec_similarity_thresholds = [0.6, 0.7, 0.8, 0.9]

# Tuning configuration: one entry per algorithm, here only Top2Vec.
parameter_tuning = {
    "Top2Vec": {
        "fn": top2vec_integration,
        "text_extraction_fn": top2vec_text_extractors,
        "similarity_threshold": top2vec_similarity_thresholds,
    }
}

# NOTE(review): presumably evaluates the configured combinations and stores the
# outcome in the JSON file given as last argument — confirm in evaluation.grid_search.
tune_parameters(
    base_textbook, other_textbooks, parameter_tuning, "evaluation-data/colab-results.json"
)