In [None]:
# Cell 1: Import libraries and setup model directory
from pathlib import Path
from transformers import (
    WhisperProcessor, WhisperForConditionalGeneration,
    Wav2Vec2ForCTC, Wav2Vec2Processor,
    Wav2Vec2CTCTokenizer, Wav2Vec2FeatureExtractor,
    AutoModelForPreTraining
)

# Set model directory path.
# Script case: `__file__` exists and parents[1] of the resolved file path (the
# parent of the file's own folder) is taken as the project root.
# Notebook case: `__file__` is undefined, so the working directory stands in
# for the file's folder and the project root is its direct parent. Using
# parents[1] of the cwd here would resolve one level too high and create
# `models/` outside the project (and raises IndexError on a shallow cwd).
# NOTE(review): assumes the kernel's working directory is the notebook's own
# folder — confirm for your launcher.
if "__file__" in globals():
    PROJECT_ROOT = Path(__file__).resolve().parents[1]
else:
    PROJECT_ROOT = Path.cwd().resolve().parent
MODEL_DIR = PROJECT_ROOT / "models"
# Idempotent: safe to re-run the cell when the directory already exists.
MODEL_DIR.mkdir(parents=True, exist_ok=True)

print(f"✅ Model directory: {MODEL_DIR}")


✅ Model directory: ../models


In [None]:
# Cell 2: Download Whisper-small (Multilingual ASR)
# Hub checkpoint id and the folder under MODEL_DIR that is passed as cache_dir.
WHISPER_NAME = "openai/whisper-small"
WHISPER_PATH = MODEL_DIR / "whisper-small"

# Model first, then processor; both are fetched through `from_pretrained`
# with the same checkpoint id and the same cache_dir.
whisper_model, whisper_processor = (
    loader.from_pretrained(WHISPER_NAME, cache_dir=str(WHISPER_PATH))
    for loader in (WhisperForConditionalGeneration, WhisperProcessor)
)

print("✅ Whisper-small downloaded.")


config.json:   0%|          | 0.00/1.97k [00:00<?, ?B/s]

To support symlinks on Windows, you either need to activate Developer Mode or to run Python as an administrator. In order to activate developer mode, see this article: https://docs.microsoft.com/en-us/windows/apps/get-started/enable-your-device-for-development


model.safetensors:   0%|          | 0.00/967M [00:00<?, ?B/s]

generation_config.json:   0%|          | 0.00/3.87k [00:00<?, ?B/s]

preprocessor_config.json:   0%|          | 0.00/185k [00:00<?, ?B/s]

tokenizer_config.json:   0%|          | 0.00/283k [00:00<?, ?B/s]

vocab.json:   0%|          | 0.00/836k [00:00<?, ?B/s]

tokenizer.json:   0%|          | 0.00/2.48M [00:00<?, ?B/s]

merges.txt:   0%|          | 0.00/494k [00:00<?, ?B/s]

normalizer.json:   0%|          | 0.00/52.7k [00:00<?, ?B/s]

added_tokens.json:   0%|          | 0.00/34.6k [00:00<?, ?B/s]

special_tokens_map.json:   0%|          | 0.00/2.19k [00:00<?, ?B/s]

✅ Whisper-small downloaded.


In [None]:
# Cell 3: Download Wav2Vec2-Turkish (fine-tuned)
# Hub checkpoint id and the folder under MODEL_DIR that is passed as cache_dir.
W2V2_TURKISH_NAME = "ceyda/wav2vec2-large-xlsr-53-turkish"
W2V2_TURKISH_PATH = MODEL_DIR / "wav2vec2-turkish"

# CTC model first, then its processor; both calls share the checkpoint id
# and the cache_dir.
w2v2_tr_model, w2v2_tr_processor = (
    loader.from_pretrained(W2V2_TURKISH_NAME, cache_dir=str(W2V2_TURKISH_PATH))
    for loader in (Wav2Vec2ForCTC, Wav2Vec2Processor)
)

print("✅ Wav2Vec2-Turkish downloaded.")


config.json:   0%|          | 0.00/1.57k [00:00<?, ?B/s]

To support symlinks on Windows, you either need to activate Developer Mode or to run Python as an administrator. In order to activate developer mode, see this article: https://docs.microsoft.com/en-us/windows/apps/get-started/enable-your-device-for-development


pytorch_model.bin:   0%|          | 0.00/1.26G [00:00<?, ?B/s]

preprocessor_config.json:   0%|          | 0.00/158 [00:00<?, ?B/s]

tokenizer_config.json:   0%|          | 0.00/138 [00:00<?, ?B/s]

vocab.json:   0%|          | 0.00/339 [00:00<?, ?B/s]

special_tokens_map.json:   0%|          | 0.00/85.0 [00:00<?, ?B/s]

✅ Wav2Vec2-Turkish downloaded.


In [None]:
# Cell 4: Download Wav2Vec2-Base (Multilingual, no tokenizer)
# NOTE(review): the "base" label is only this notebook's name for the folder;
# the checkpoint id requested below is the large XLSR-53 one.
W2V2_BASE_MODEL = "facebook/wav2vec2-large-xlsr-53"
W2V2_BASE_PATH = MODEL_DIR / "wav2vec2-base"

# Only a feature extractor and the pretraining model are requested here —
# no tokenizer/processor is loaded. Feature extractor first, then the model.
feature_extractor, w2v2_base_model = (
    loader.from_pretrained(W2V2_BASE_MODEL, cache_dir=str(W2V2_BASE_PATH))
    for loader in (Wav2Vec2FeatureExtractor, AutoModelForPreTraining)
)

print("✅ Wav2Vec2-Base downloaded successfully (without tokenizer)")


✅ Wav2Vec2-Base downloaded successfully (without tokenizer)


model.safetensors:   0%|          | 0.00/1.27G [00:00<?, ?B/s]