# NotebookLM-Kokoro TTS Project

This notebook generates audio from PDF documents: a podcast-style transcript is produced from the PDF and then converted to speech with the Kokoro TTS model. It includes installation steps, a GPU availability check, API key setup, and the audio generation function.

In [None]:
# Install necessary packages
!pip install -q kokoro>=0.9.2 soundfile torch PyPDF2 numpy openai gradio

# Check if GPU is available
import torch
if torch.cuda.is_available():
    print("GPU is available.")
else:
    print("GPU is not available. Using CPU instead.")

In [None]:
# Import necessary modules
import os
import tempfile
import shutil
import numpy as np
import soundfile as sf
import ast
from notebook_lm_kokoro import generate_podcast_script, generate_audio_from_script
from notebook_lm_kokoro import KPipeline

# Set OpenAI API key.
# setdefault keeps a key that is already exported in the environment, so the
# placeholder below never overwrites a real credential. If no key is set yet,
# replace the placeholder with your own key (and avoid committing it).
os.environ.setdefault('OPENAI_API_KEY', 'your_api_key_here')
# Uncomment the following line if using OpenRouter
# os.environ['OPENROUTER_API_BASE'] = 'https://openrouter.ai/api/v1'

In [None]:
# Function to generate audio from a PDF file
def generate_audio_from_pdf(pdf_path, speaker1_voice='af_heart', speaker2_voice='af_nicole'):
    """Generate an audio file from a PDF document.

    A transcript is obtained from ``generate_podcast_script`` and handed to
    ``generate_audio_from_script`` together with an output path derived from
    ``pdf_path``: the file extension is stripped and ``_audio.wav`` appended.

    Args:
        pdf_path: Path to the source PDF file.
        speaker1_voice: Currently unused by this function.
        speaker2_voice: Currently unused by this function.
            NOTE(review): neither voice is forwarded to
            ``generate_audio_from_script`` -- confirm whether that function
            accepts voice arguments and pass them through if it does.

    Returns:
        The output audio path on success, or ``None`` when the transcript or
        the audio could not be generated.
    """
    # Generate transcript from PDF
    transcript, _ = generate_podcast_script(pdf_path)
    if transcript is None:
        print("Error generating transcript.")
        return None

    # Define output audio file path.
    # splitext only strips the final extension; a plain str.replace('.pdf', ...)
    # would also rewrite ".pdf" inside directory names and would return the
    # input path unchanged for ".PDF" or extension-less files, making the
    # audio output path identical to the source PDF path.
    base_path, _ext = os.path.splitext(pdf_path)
    audio_output_path = base_path + '_audio.wav'

    # Generate audio from the transcript
    result = generate_audio_from_script(transcript, audio_output_path)
    if result is None:
        print("Error generating audio.")
        return None

    print(f"Audio generated and saved as: {audio_output_path}")
    return audio_output_path

# Example usage: point the path below at a real PDF, then run this cell
pdf_file_path = '/path/to/your/pdf_file.pdf'  # Change this to your PDF file path
generate_audio_from_pdf(pdf_path=pdf_file_path)