# Convert downloaded GloVe embeddings to NumPy format

In [10]:
import numpy as np
import pickle
import os

def convert_glove_to_embeddings(glove_file: str, output_dir: str) -> None:
    """Convert a GloVe text file into a NumPy matrix plus a word-index map.

    Each non-blank line of ``glove_file`` is split on whitespace: the first
    field is the token, the remaining fields are parsed as float32 vector
    components. Two files are written into ``output_dir``:

    * ``embeddings.npy`` -- array built from the parsed vectors, one row
      per non-blank line, in file order.
    * ``word_to_idx.pkl`` -- pickled dict mapping each token to the row index
      of its vector (a repeated token keeps its last row).

    Args:
        glove_file: Path of the UTF-8 GloVe text file to read.
        output_dir: Directory receiving the output files; created if missing.

    Returns:
        None. If ``glove_file`` does not exist, the error is printed and
        nothing is saved.
    """
    # Create output directory if it doesn't exist
    os.makedirs(output_dir, exist_ok=True)

    word_to_idx = {}
    embeddings = []

    # Print the file path for debugging
    print(f"Trying to open: {glove_file}")

    # Only the read is guarded: a missing input file is the one failure this
    # function reports instead of raising.
    try:
        with open(glove_file, 'r', encoding='utf-8') as f:
            for line in f:
                values = line.split()
                if not values:
                    # Blank lines (e.g. stray trailing newlines) carry no
                    # vector; skipping them avoids an IndexError below.
                    continue
                # Index by row position rather than by line number so that
                # skipped lines never leave word_to_idx out of step with
                # the embedding matrix.
                word_to_idx[values[0]] = len(embeddings)
                embeddings.append(np.array(values[1:], dtype='float32'))
    except FileNotFoundError as e:
        print(f"Error: {e}")
        return

    embeddings_path = os.path.join(output_dir, 'embeddings.npy')
    vocab_path = os.path.join(output_dir, 'word_to_idx.pkl')

    # Convert the list of vectors to a single NumPy array and save both
    # artifacts.
    np.save(embeddings_path, np.array(embeddings))
    with open(vocab_path, 'wb') as f:
        pickle.dump(word_to_idx, f)

    # Report the joined paths actually written (avoids a doubled separator
    # when output_dir already ends with one).
    print(f"Saved embeddings to {embeddings_path} and word_to_idx to {vocab_path}")

# Example: convert the 200-dimensional GloVe 6B file, writing the outputs
# next to it in the data directory.
convert_glove_to_embeddings(
    glove_file='../data/glove.6B.200d.txt',
    output_dir='../data/',
)

Trying to open: ../data/glove.6B.200d.txt
Saved embeddings to ../data//embeddings.npy and word_to_idx to ../data//word_to_idx.pkl
