# DeepSeek-R1 Training and Fine-tuning

This notebook provides comprehensive training and fine-tuning capabilities for DeepSeek-R1 models.

## Features:
- Download and configure DeepSeek-R1 models
- Create reasoning datasets for fine-tuning
- Fine-tune DeepSeek-R1 distilled models
- Integrate with the brain simulation framework
- Monitor training progress and performance

---


In [None]:
# Setup and imports
import sys
import os
import torch
import json
import numpy as np
import matplotlib.pyplot as plt
from datetime import datetime
from typing import Dict, List, Any, Optional
from pathlib import Path

# Transformers and training libraries
from transformers import (
    AutoTokenizer, 
    AutoModelForCausalLM,
    TrainingArguments,
    Trainer,
    DataCollatorForLanguageModeling
)
from datasets import Dataset, load_dataset
from accelerate import Accelerator

# Add project paths.
# The membership check keeps sys.path free of duplicate entries when this
# cell is re-run. The entries are relative, so imports resolve them against
# the current working directory.
for _project_path in ('../../src', '../../database'):
    if _project_path not in sys.path:
        sys.path.append(_project_path)

# Configure matplotlib
%matplotlib inline
plt.style.use('seaborn-v0_8')

# Report the training environment: the PyTorch version, whether CUDA is
# available and, when it is, the name and total memory of device 0.
print("🧠 DeepSeek-R1 Training Environment")
print(f"🔧 PyTorch version: {torch.__version__}")
_cuda_available = torch.cuda.is_available()  # queried once, reused below
print(f"🚀 CUDA available: {_cuda_available}")
if _cuda_available:
    print(f"📱 GPU: {torch.cuda.get_device_name(0)}")
    # total_memory is reported in bytes. True division with one decimal
    # avoids the under-reporting that floor division causes (a 15.7 GiB
    # card would otherwise print as "15 GB").
    _gpu_memory_gib = torch.cuda.get_device_properties(0).total_memory / 1024**3
    print(f"💾 GPU Memory: {_gpu_memory_gib:.1f} GB")
