In [1]:
import os, sys
# Prepend '..' (resolved against the current working directory) to the import
# search path. Presumably this is what makes the project-local packages
# imported in the next cell (models, utils, datasets) resolvable — confirm
# against the repository layout.
sys.path.insert(0, '..')

In [2]:
import gensim
import gc
from os.path import join as j
import json
from tqdm import tqdm, trange
from models import glove, custom_trained_model, word2vec
from utils.dataset import PandasDataset
from datasets.nyt import Nyt
from utils.weat import WEAT
from sklearn.decomposition import PCA
from sklearn.discriminant_analysis import LinearDiscriminantAnalysis
from sklearn.neighbors import KNeighborsClassifier
import seaborn as sns, numpy as np, pandas as pd, random
import matplotlib.pyplot as plt
from mpl_toolkits.mplot3d import Axes3D
import warnings
# Suppress every warning for the rest of the session. No category is given, so
# this also hides deprecation notices raised by the plotting / ML libraries.
warnings.filterwarnings('ignore')


# NOTE(review): automatic garbage collection is enabled by default in CPython,
# so this call looks redundant unless something disabled it earlier — confirm.
gc.enable()

In [3]:
def get_bar_plot(y, pred):
    """Count correct and incorrect predictions per class in bar-plot form.

    Parameters
    ----------
    y : sequence
        True labels. Any sortable label values are accepted; they do not have
        to be the integers ``0..k-1``.
    pred : sequence
        Predicted labels, indexed in parallel with ``y``.

    Returns
    -------
    pandas.DataFrame
        Long-format frame with ``2 * k`` rows (``k`` = number of distinct
        values in ``y``) and three columns:
        ``x``   - the class label (the sorted unique labels, repeated twice),
        ``y``   - how many samples of that class fall in the row's bucket,
        ``hue`` - ``True`` for the "predicted correctly" bucket, ``False`` for
                  the "predicted incorrectly" bucket.
    """
    # return_inverse yields, for every sample, the position of its label within
    # the sorted unique labels. Indexing the counters by that position (rather
    # than by the raw label value) keeps the function correct for labels that
    # are not exactly 0..k-1 (e.g. {2, 5} or negative values).
    labels, positions = np.unique(y, return_inverse=True)
    positions = np.ravel(positions)
    classes = len(labels)

    # First `classes` slots: correct predictions; last `classes` slots: errors.
    match = [0] * (classes * 2)
    for idx, pos in enumerate(positions):
        if y[idx] == pred[idx]:
            match[pos] += 1
        else:
            match[pos + classes] += 1
    return pd.DataFrame({'x': list(labels) * 2, 'y': match, 'hue': [True] * classes + [False] * classes})

In [4]:
def plot_(x, y, colors, z=None, title="year", three=False, scale=True):
    """Draw a 2-D or 3-D scatter plot of the given points and show it.

    Parameters
    ----------
    x, y : sequence of float
        Coordinates along the first two axes.
    colors : sequence
        Per-point colours, forwarded as ``c=`` to matplotlib's ``scatter``.
    z : sequence of float, optional
        Third coordinate; only read when ``three`` is true.
    title : str
        Title placed on the plot.
    three : bool
        Draw a 3-D scatter when true, a 2-D scatter otherwise.
    scale : bool
        When true, pin the axis limits to [-1, 1] (3-D) or [-2, 2] (2-D)
        instead of letting matplotlib choose them.
    """
    # https://stackoverflow.com/a/60621783
    sns.set_style("whitegrid", {'axes.grid' : False})
    fig = plt.figure(figsize=(6,6))
    if three:
        # Create the 3-D axes through the figure. Instantiating Axes3D(fig)
        # directly no longer attaches the axes to the figure in current
        # matplotlib releases, which leaves the plot empty.
        ax = fig.add_subplot(111, projection='3d')
        g = ax.scatter(x, y, z, c=colors, marker='o', depthshade=False, cmap='Paired')
        if scale:
            ax.set_zlim(-1, 1)
            ax.set_xlim(-1, 1)
            ax.set_ylim(-1, 1)
        ax.set_zlabel('Z Label')
        ax.set_xlabel('X Label')
        ax.set_ylabel('Y Label')
        ax.set_title(title)
        # Legend entries come from the scatter's colour-mapped values.
        # NOTE(review): when `colors` holds plain colour names there may be
        # nothing to list, giving an empty legend — confirm intended.
        legend = ax.legend(*g.legend_elements(), loc="lower center", borderaxespad=-10, ncol=4)
        ax.add_artist(legend)
    else:
        plt.scatter(x, y, c=colors)
        if scale:
            plt.xlim(-2, 2)
            plt.ylim(-2, 2)
        plt.title(title)
    plt.show()

In [5]:
def plot_model(model, model_title, man_words, woman_words, occupations=None):
    """Visualise how a model separates the given word groups and score it with WEAT.

    The words are embedded with ``model.transform`` and then shown as:
    a 3-D PCA scatter, a 2-D PCA scatter, an LDA projection (2-D when
    occupations are given, otherwise the single LDA axis plotted against the
    class label) and a bar chart of 3-nearest-neighbour predictions per class.

    Parameters
    ----------
    model : object
        Must expose ``transform(list_of_words)``; it is also handed to ``WEAT``.
    model_title : str
        Prefix used for every plot title.
    man_words, woman_words : list of str
        Words labelled as class 0 (blue) and class 1 (pink).
    occupations : list of str, optional
        Words labelled as class 2 (green). Omitted or empty means only the
        two-class plots are produced.

    Returns
    -------
    Whatever ``WEAT(model, words_json='../weat/weat.json').get_scores()`` returns.
    """
    # None replaces the former mutable `[]` default; behaviour is unchanged.
    if occupations is None:
        occupations = []

    vecs = model.transform(man_words + woman_words + occupations)
    colors = ['blue'] * len(man_words) + ['pink'] * len(woman_words) + ['green'] * len(occupations)

    # Fit PCA once and reuse the projection: the 2-D view is just the first two
    # columns of the same seeded decomposition that feeds the 3-D view.
    projected = PCA(random_state=0).fit_transform(vecs)

    # plot 3D graph using PCA
    plot_(projected[:, 0], projected[:, 1], z=projected[:, 2], title=model_title + "_3D_PCA", three=True, scale=False, colors=colors)

    # plot 2 D plot using PCA
    plot_(projected[:, 0], projected[:, 1], title=model_title + "_2D_PCA", three=False, scale=False, colors=colors)

    # plot LDA
    # Class labels follow the concatenation order used for `vecs`.
    y = np.concatenate([np.zeros(shape=len(man_words), dtype=int), np.ones(dtype=int, shape=len(woman_words)),
                    np.full(dtype=int, shape=len(occupations), fill_value=2)])
    two = LinearDiscriminantAnalysis().fit_transform(vecs, y)

    # NOTE(review): the classifier is evaluated on the same vectors it was
    # fitted on, so the bar chart shows training-set agreement, not held-out accuracy.
    knn = KNeighborsClassifier(n_neighbors=3)
    knn.fit(vecs, y)
    pred = knn.predict(vecs)
    df = get_bar_plot(y=y, pred=pred)
    if len(occupations):
        plot_(two[:, 0], two[:, 1], title=model_title + "_2D_LDA", three=False, scale=False, colors=colors)
    else:
        # Without occupations only one LDA axis is used, so it is plotted
        # against the class label.
        plot_(two[:, 0], y, title=model_title + "_1D_LDA", three=False, scale=False, colors=colors)
    sns.barplot(data=df, x='x', y='y', hue='hue', ).set_title(model_title + "_KNN classification")
    plt.show()
    return WEAT(model, words_json='../weat/weat.json').get_scores()

In [6]:
# Directory prefix for the per-decade CSV inputs (see CSV below).
DIR = '/tmp/temp/'
# Start year of each slice: 1921, 1931, ..., 2011 (10 values).
YEARS = range(1921, 2021, 10)
# Output directory template for saved embeddings; formatted with the start year.
EMBEDDINGS_DIR = '../trained_models/glove/embeddings_{}/'
# Keys into the word-list JSON loaded below.
MAN, WOMAN, OCCUPATIONS = 'Man words', 'Woman words', 'Occupations with Human Stereotype Scores'
# Load the word lists through a context manager so the file handle is closed
# deterministically instead of being left to the garbage collector.
with open('../weat/GargWordList.json') as word_file:
    words = json.load(word_file)
words[WOMAN].remove('femen')  # dropped from the list: meaning of 'femen' unclear
# File-name template for one slice; formatted with st=<start year>, end=<end year>.
CSV = "df_{st}_to_{end}.csv"
# One row per entry in YEARS.
# NOTE(review): the 7 columns presumably match the number of scores per model — confirm.
SCORES = np.zeros(shape=(len(YEARS), 7))
CUSTOM_MODEL_PATH = "../trained_models/GoogleNews-vectors-negative300.bin"

# GLOVE MODELS

In [7]:
# Fit and save one GloVe model per slice of the corpus listed in YEARS.
# tqdm wraps YEARS itself rather than the enumerate object: enumerate has no
# length, so the bar could only print "0it [00:00, ?it/s]" with no total or ETA.
for idx, y in enumerate(tqdm(YEARS)):
    # Each slice covers the ten years y .. y+9.
    dataset = DIR + CSV.format(st=y, end=y+9)
    saved_model_path = EMBEDDINGS_DIR.format(y)
    lines = Nyt(dataset).lines
    m = glove.Glove(load=False).fit(lines, glove_path='../scripts/').save(saved_model_path)

0it [00:00, ?it/s]

make: Entering directory '/home/ashutosh/study/bias_manifold/scripts'
rm -rf glove shuffle cooccur vocab_count build
make: Leaving directory '/home/ashutosh/study/bias_manifold/scripts'
make: Entering directory '/home/ashutosh/study/bias_manifold/scripts'
mkdir -p build
gcc ./glove.c -o build/glove -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic


./glove.c: In function ‘save_params’:
  249 |               if (write_header) fprintf(fout, "%ld %d\n", vocab_size, vector_size);
      |                                                ~~^        ~~~~~~~~~~
      |                                                  |        |
      |                                                  long int long long int
      |                                                %lld
./glove.c: In function ‘initialize_parameters’:
   98 |             fread(&W[a], sizeof(real), 1, fin);
      |             ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./glove.c: In function ‘glove_thread’:
  133 |         fread(&cr, sizeof(CREC), 1, fin);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~


gcc ./shuffle.c -o build/shuffle -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic
gcc ./cooccur.c -o build/cooccur -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic


./shuffle.c: In function ‘shuffle_merge’:
  107 |                 fread(&array[i], sizeof(CREC), 1, fid[j]);
      |                 ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./shuffle.c: In function ‘shuffle_by_chunks’:
  165 |         fread(&array[i], sizeof(CREC), 1, fin);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./cooccur.c: In function ‘merge_files’:
  267 |         fread(&new, sizeof(CREC), 1, fid[i]);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
  277 |     fread(&new, sizeof(CREC), 1, fid[i]);
      |     ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
  290 |         fread(&new, sizeof(CREC), 1, fid[i]);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~


gcc ./vocab_count.c -o build/vocab_count -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic
make: Leaving directory '/home/ashutosh/study/bias_manifold/scripts'


BUILDING VOCABULARY


Processed 0 tokens.[11G100000 tokens.[11G200000 tokens.[11G300000 tokens.[11G400000 tokens.[11G500000 tokens.[11G600000 tokens.[11G700000 tokens.[11G800000 tokens.[11G900000 tokens.[11G1000000 tokens.[11G1100000 tokens.[11G1200000 tokens.[11G1300000 tokens.[11G1400000 tokens.[11G1500000 tokens.[11G1600000 tokens.[11G1700000 tokens.[11G1800000 tokens.[11G1900000 tokens.[11G2000000 tokens.[11G2100000 tokens.[11G2200000 tokens.[11G2300000 tokens.[11G2400000 tokens.[11G2500000 tokens.[11G2600000 tokens.[11G2700000 tokens.[11G2800000 tokens.[11G2900000 tokens.[11G3000000 tokens.[11G3100000 tokens.[11G3200000 tokens.[11G3300000 tokens.[11G3400000 tokens.[11G3500000 tokens.[11G3600000 tokens.[11G3700000 tokens.[11G3800000 tokens.[11G3900000 tokens.[11G4000000 tokens.[11G4100000 tokens.[11G4200000 tokens.[11G4300000 tokens.[11G4400000 tokens.[11G4500000 tokens.[11G4600000 tokens.[11G4700000 tokens.[11G4800000 tokens.[11G4900000 tokens.[11G50000

[11G44500000 tokens.[11G44600000 tokens.[11G44700000 tokens.[11G44800000 tokens.[11G44900000 tokens.[11G45000000 tokens.[11G45100000 tokens.[11G45200000 tokens.[11G45300000 tokens.[11G45400000 tokens.[11G45500000 tokens.[11G45600000 tokens.[11G45700000 tokens.[11G45800000 tokens.[11G45900000 tokens.[11G46000000 tokens.[11G46100000 tokens.[11G46200000 tokens.[11G46300000 tokens.[0GProcessed 46353529 tokens.
Counted 456483 unique words.
Truncating vocabulary at min count 5.
Using vocabulary of size 94230.

COUNTING COOCCURRENCES
window size: 8
context: symmetric
max product: 20163704
overflow length: 57042534
Reading vocab from file "/tmp/temp.vocab"...loaded 94230 words.
Building lookup table...table contains 142818143 elements.
Processing token: 0[19G100000[19G200000[19G300000[19G400000[19G500000[19G600000[19G700000[19G800000[19G900000[19G1000000[19G1100000[19G1200000[19G1300000[19G1400000[19G1500000[19G1600000[19G1700000[19G1800000[19G1900000[19

Merging cooccurrence files: processed 0 lines.[39G100000 lines.[39G200000 lines.[39G300000 lines.[39G400000 lines.[39G500000 lines.[39G600000 lines.[39G700000 lines.[39G800000 lines.[39G900000 lines.[39G1000000 lines.[39G1100000 lines.[39G1200000 lines.[39G1300000 lines.[39G1400000 lines.[39G1500000 lines.[39G1600000 lines.[39G1700000 lines.[39G1800000 lines.[39G1900000 lines.[39G2000000 lines.[39G2100000 lines.[39G2200000 lines.[39G2300000 lines.[39G2400000 lines.[39G2500000 lines.[39G2600000 lines.[39G2700000 lines.[39G2800000 lines.[39G2900000 lines.[39G3000000 lines.[39G3100000 lines.[39G3200000 lines.[39G3300000 lines.[39G3400000 lines.[39G3500000 lines.[39G3600000 lines.[39G3700000 lines.[39G3800000 lines.[39G3900000 lines.[39G4000000 lines.[39G4100000 lines.[39G4200000 lines.[39G4300000 lines.[39G4400000 lines.[39G4500000 lines.[39G4600000 lines.[39G4700000 lines.[39G4800000 lines.[39G4900000 lines.[39G5000000 lines.[39G5100000 

[39G42000000 lines.[39G42100000 lines.[39G42200000 lines.[39G42300000 lines.[39G42400000 lines.[39G42500000 lines.[39G42600000 lines.[39G42700000 lines.[39G42800000 lines.[39G42900000 lines.[39G43000000 lines.[39G43100000 lines.[39G43200000 lines.[39G43300000 lines.[39G43400000 lines.[39G43500000 lines.[39G43600000 lines.[39G43700000 lines.[39G43800000 lines.[39G43900000 lines.[39G44000000 lines.[39G44100000 lines.[39G44200000 lines.[39G44300000 lines.[39G44400000 lines.[39G44500000 lines.[39G44600000 lines.[39G44700000 lines.[39G44800000 lines.[39G44900000 lines.[39G45000000 lines.[39G45100000 lines.[39G45200000 lines.[39G45300000 lines.[39G45400000 lines.[39G45500000 lines.[39G45600000 lines.[39G45700000 lines.[39G45800000 lines.[39G45900000 lines.[39G46000000 lines.[39G46100000 lines.[39G46200000 lines.[39G46300000 lines.[39G46400000 lines.[39G46500000 lines.[39G46600000 lines.[39G46700000 lines.[39G46800000 lines.[39G46900000 lines.

make: Entering directory '/home/ashutosh/study/bias_manifold/scripts'
rm -rf glove shuffle cooccur vocab_count build
make: Leaving directory '/home/ashutosh/study/bias_manifold/scripts'
make: Entering directory '/home/ashutosh/study/bias_manifold/scripts'
mkdir -p build
gcc ./glove.c -o build/glove -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic


./glove.c: In function ‘save_params’:
  249 |               if (write_header) fprintf(fout, "%ld %d\n", vocab_size, vector_size);
      |                                                ~~^        ~~~~~~~~~~
      |                                                  |        |
      |                                                  long int long long int
      |                                                %lld
./glove.c: In function ‘initialize_parameters’:
   98 |             fread(&W[a], sizeof(real), 1, fin);
      |             ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./glove.c: In function ‘glove_thread’:
  133 |         fread(&cr, sizeof(CREC), 1, fin);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~


gcc ./shuffle.c -o build/shuffle -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic
gcc ./cooccur.c -o build/cooccur -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic


./shuffle.c: In function ‘shuffle_merge’:
  107 |                 fread(&array[i], sizeof(CREC), 1, fid[j]);
      |                 ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./shuffle.c: In function ‘shuffle_by_chunks’:
  165 |         fread(&array[i], sizeof(CREC), 1, fin);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./cooccur.c: In function ‘merge_files’:
  267 |         fread(&new, sizeof(CREC), 1, fid[i]);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
  277 |     fread(&new, sizeof(CREC), 1, fid[i]);
      |     ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
  290 |         fread(&new, sizeof(CREC), 1, fid[i]);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~


gcc ./vocab_count.c -o build/vocab_count -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic
make: Leaving directory '/home/ashutosh/study/bias_manifold/scripts'


BUILDING VOCABULARY


Processed 0 tokens.[11G100000 tokens.[11G200000 tokens.[11G300000 tokens.[11G400000 tokens.[11G500000 tokens.[11G600000 tokens.[11G700000 tokens.[11G800000 tokens.[11G900000 tokens.[11G1000000 tokens.[11G1100000 tokens.[11G1200000 tokens.[11G1300000 tokens.[11G1400000 tokens.[11G1500000 tokens.[11G1600000 tokens.[11G1700000 tokens.[11G1800000 tokens.[11G1900000 tokens.[11G2000000 tokens.[11G2100000 tokens.[11G2200000 tokens.[11G2300000 tokens.[11G2400000 tokens.[11G2500000 tokens.[11G2600000 tokens.[11G2700000 tokens.[11G2800000 tokens.[11G2900000 tokens.[11G3000000 tokens.[11G3100000 tokens.[11G3200000 tokens.[11G3300000 tokens.[11G3400000 tokens.[11G3500000 tokens.[11G3600000 tokens.[11G3700000 tokens.[11G3800000 tokens.[11G3900000 tokens.[11G4000000 tokens.[11G4100000 tokens.[11G4200000 tokens.[11G4300000 tokens.[11G4400000 tokens.[11G4500000 tokens.[11G4600000 tokens.[11G4700000 tokens.[11G4800000 tokens.[11G4900000 tokens.[11G50000

[11G44700000 tokens.[11G44800000 tokens.[11G44900000 tokens.[11G45000000 tokens.[11G45100000 tokens.[11G45200000 tokens.[11G45300000 tokens.[11G45400000 tokens.[11G45500000 tokens.[11G45600000 tokens.[11G45700000 tokens.[11G45800000 tokens.[11G45900000 tokens.[11G46000000 tokens.[11G46100000 tokens.[11G46200000 tokens.[11G46300000 tokens.[11G46400000 tokens.[11G46500000 tokens.[11G46600000 tokens.[11G46700000 tokens.[11G46800000 tokens.[11G46900000 tokens.[11G47000000 tokens.[11G47100000 tokens.[11G47200000 tokens.[11G47300000 tokens.[11G47400000 tokens.[11G47500000 tokens.[11G47600000 tokens.[11G47700000 tokens.[11G47800000 tokens.[11G47900000 tokens.[11G48000000 tokens.[11G48100000 tokens.[11G48200000 tokens.[11G48300000 tokens.[11G48400000 tokens.[11G48500000 tokens.[11G48600000 tokens.[11G48700000 tokens.[11G48800000 tokens.[11G48900000 tokens.[11G49000000 tokens.[11G49100000 tokens.[11G49200000 tokens.[11G49300000 tokens.[11G49400000

Processing token: 0[19G100000[19G200000[19G300000[19G400000[19G500000[19G600000[19G700000[19G800000[19G900000[19G1000000[19G1100000[19G1200000[19G1300000[19G1400000[19G1500000[19G1600000[19G1700000[19G1800000[19G1900000[19G2000000[19G2100000[19G2200000[19G2300000[19G2400000[19G2500000[19G2600000[19G2700000[19G2800000[19G2900000[19G3000000[19G3100000[19G3200000[19G3300000[19G3400000[19G3500000[19G3600000[19G3700000[19G3800000[19G3900000[19G4000000[19G4100000[19G4200000[19G4300000[19G4400000[19G4500000[19G4600000[19G4700000[19G4800000[19G4900000[19G5000000[19G5100000[19G5200000[19G5300000[19G5400000[19G5500000[19G5600000[19G5700000[19G5800000[19G5900000[19G6000000[19G6100000[19G6200000[19G6300000[19G6400000[19G6500000[19G6600000[19G6700000[19G6800000[19G6900000[19G7000000[19G7100000[19G7200000[19G7300000[19G7400000[19G7500000[19G7600000[19G7700000[19G7800000[19G7900000[19G8000000[19G8100000[19G8200000[19G8

[19G64000000[19G64100000[19G64200000[19G64300000[19G64400000[19G64500000[19G64600000[19G64700000[0GProcessed 64712082 tokens.
Writing cooccurrences to disk.........3 files in total.


Merging cooccurrence files: processed 0 lines.[39G100000 lines.[39G200000 lines.[39G300000 lines.[39G400000 lines.[39G500000 lines.[39G600000 lines.[39G700000 lines.[39G800000 lines.[39G900000 lines.[39G1000000 lines.[39G1100000 lines.[39G1200000 lines.[39G1300000 lines.[39G1400000 lines.[39G1500000 lines.[39G1600000 lines.[39G1700000 lines.[39G1800000 lines.[39G1900000 lines.[39G2000000 lines.[39G2100000 lines.[39G2200000 lines.[39G2300000 lines.[39G2400000 lines.[39G2500000 lines.[39G2600000 lines.[39G2700000 lines.[39G2800000 lines.[39G2900000 lines.[39G3000000 lines.[39G3100000 lines.[39G3200000 lines.[39G3300000 lines.[39G3400000 lines.[39G3500000 lines.[39G3600000 lines.[39G3700000 lines.[39G3800000 lines.[39G3900000 lines.[39G4000000 lines.[39G4100000 lines.[39G4200000 lines.[39G4300000 lines.[39G4400000 lines.[39G4500000 lines.[39G4600000 lines.[39G4700000 lines.[39G4800000 lines.[39G4900000 lines.[39G5000000 lines.[39G5100000 

[39G45600000 lines.[39G45700000 lines.[39G45800000 lines.[39G45900000 lines.[39G46000000 lines.[39G46100000 lines.[39G46200000 lines.[39G46300000 lines.[39G46400000 lines.[39G46500000 lines.[39G46600000 lines.[39G46700000 lines.[39G46800000 lines.[39G46900000 lines.[39G47000000 lines.[39G47100000 lines.[39G47200000 lines.[39G47300000 lines.[39G47400000 lines.[39G47500000 lines.[39G47600000 lines.[39G47700000 lines.[39G47800000 lines.[39G47900000 lines.[39G48000000 lines.[39G48100000 lines.[39G48200000 lines.[39G48300000 lines.[39G48400000 lines.[39G48500000 lines.[39G48600000 lines.[39G48700000 lines.[39G48800000 lines.[39G48900000 lines.[39G49000000 lines.[39G49100000 lines.[39G49200000 lines.[39G49300000 lines.[39G49400000 lines.[39G49500000 lines.[39G49500000 lines.[39G49600000 lines.[39G49700000 lines.[39G49800000 lines.[39G49900000 lines.[39G50000000 lines.[39G50100000 lines.[39G50200000 lines.[39G50300000 lines.[39G50400000 lines.

make: Entering directory '/home/ashutosh/study/bias_manifold/scripts'
rm -rf glove shuffle cooccur vocab_count build
make: Leaving directory '/home/ashutosh/study/bias_manifold/scripts'
make: Entering directory '/home/ashutosh/study/bias_manifold/scripts'
mkdir -p build
gcc ./glove.c -o build/glove -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic


./glove.c: In function ‘save_params’:
  249 |               if (write_header) fprintf(fout, "%ld %d\n", vocab_size, vector_size);
      |                                                ~~^        ~~~~~~~~~~
      |                                                  |        |
      |                                                  long int long long int
      |                                                %lld
./glove.c: In function ‘initialize_parameters’:
   98 |             fread(&W[a], sizeof(real), 1, fin);
      |             ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./glove.c: In function ‘glove_thread’:
  133 |         fread(&cr, sizeof(CREC), 1, fin);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~


gcc ./shuffle.c -o build/shuffle -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic
gcc ./cooccur.c -o build/cooccur -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic


./shuffle.c: In function ‘shuffle_merge’:
  107 |                 fread(&array[i], sizeof(CREC), 1, fid[j]);
      |                 ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./shuffle.c: In function ‘shuffle_by_chunks’:
  165 |         fread(&array[i], sizeof(CREC), 1, fin);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./cooccur.c: In function ‘merge_files’:
  267 |         fread(&new, sizeof(CREC), 1, fid[i]);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
  277 |     fread(&new, sizeof(CREC), 1, fid[i]);
      |     ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
  290 |         fread(&new, sizeof(CREC), 1, fid[i]);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~


gcc ./vocab_count.c -o build/vocab_count -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic
make: Leaving directory '/home/ashutosh/study/bias_manifold/scripts'


BUILDING VOCABULARY


Processed 0 tokens.[11G100000 tokens.[11G200000 tokens.[11G300000 tokens.[11G400000 tokens.[11G500000 tokens.[11G600000 tokens.[11G700000 tokens.[11G800000 tokens.[11G900000 tokens.[11G1000000 tokens.[11G1100000 tokens.[11G1200000 tokens.[11G1300000 tokens.[11G1400000 tokens.[11G1500000 tokens.[11G1600000 tokens.[11G1700000 tokens.[11G1800000 tokens.[11G1900000 tokens.[11G2000000 tokens.[11G2100000 tokens.[11G2200000 tokens.[11G2300000 tokens.[11G2400000 tokens.[11G2500000 tokens.[11G2600000 tokens.[11G2700000 tokens.[11G2800000 tokens.[11G2900000 tokens.[11G3000000 tokens.[11G3100000 tokens.[11G3200000 tokens.[11G3300000 tokens.[11G3400000 tokens.[11G3500000 tokens.[11G3600000 tokens.[11G3700000 tokens.[11G3800000 tokens.[11G3900000 tokens.[11G4000000 tokens.[11G4100000 tokens.[11G4200000 tokens.[11G4300000 tokens.[11G4400000 tokens.[11G4500000 tokens.[11G4600000 tokens.[11G4700000 tokens.[11G4800000 tokens.[11G4900000 tokens.[11G50000

[11G44500000 tokens.[11G44600000 tokens.[11G44700000 tokens.[11G44800000 tokens.[11G44900000 tokens.[11G45000000 tokens.[11G45100000 tokens.[11G45200000 tokens.[11G45300000 tokens.[11G45400000 tokens.[11G45500000 tokens.[11G45600000 tokens.[11G45700000 tokens.[11G45800000 tokens.[11G45900000 tokens.[11G46000000 tokens.[11G46100000 tokens.[11G46200000 tokens.[11G46300000 tokens.[11G46400000 tokens.[11G46500000 tokens.[11G46600000 tokens.[11G46700000 tokens.[11G46800000 tokens.[11G46900000 tokens.[11G47000000 tokens.[11G47100000 tokens.[11G47200000 tokens.[11G47300000 tokens.[11G47400000 tokens.[11G47500000 tokens.[11G47600000 tokens.[11G47700000 tokens.[11G47800000 tokens.[11G47900000 tokens.[11G48000000 tokens.[11G48100000 tokens.[11G48200000 tokens.[11G48300000 tokens.[11G48400000 tokens.[11G48500000 tokens.[11G48600000 tokens.[11G48700000 tokens.[11G48800000 tokens.[11G48900000 tokens.[11G49000000 tokens.[11G49100000 tokens.[11G49200000

Processing token: 0[19G100000[19G200000[19G300000[19G400000[19G500000[19G600000[19G700000[19G800000[19G900000[19G1000000[19G1100000[19G1200000[19G1300000[19G1400000[19G1500000[19G1600000[19G1700000[19G1800000[19G1900000[19G2000000[19G2100000[19G2200000[19G2300000[19G2400000[19G2500000[19G2600000[19G2700000[19G2800000[19G2900000[19G3000000[19G3100000[19G3200000[19G3300000[19G3400000[19G3500000[19G3600000[19G3700000[19G3800000[19G3900000[19G4000000[19G4100000[19G4200000[19G4300000[19G4400000[19G4500000[19G4600000[19G4700000[19G4800000[19G4900000[19G5000000[19G5100000[19G5200000[19G5300000[19G5400000[19G5500000[19G5600000[19G5700000[19G5800000[19G5900000[19G6000000[19G6100000[19G6200000[19G6300000[19G6400000[19G6500000[19G6600000[19G6700000[19G6800000[19G6900000[19G7000000[19G7100000[19G7200000[19G7300000[19G7400000[19G7500000[19G7600000[19G7700000[19G7800000[19G7900000[19G8000000[19G8100000[19G8200000[19G8

Merging cooccurrence files: processed 0 lines.[39G100000 lines.[39G200000 lines.[39G300000 lines.[39G400000 lines.[39G500000 lines.[39G600000 lines.[39G700000 lines.[39G800000 lines.[39G900000 lines.[39G1000000 lines.[39G1100000 lines.[39G1200000 lines.[39G1300000 lines.[39G1400000 lines.[39G1500000 lines.[39G1600000 lines.[39G1700000 lines.[39G1800000 lines.[39G1900000 lines.[39G2000000 lines.[39G2100000 lines.[39G2200000 lines.[39G2300000 lines.[39G2400000 lines.[39G2500000 lines.[39G2600000 lines.[39G2700000 lines.[39G2800000 lines.[39G2900000 lines.[39G3000000 lines.[39G3100000 lines.[39G3200000 lines.[39G3300000 lines.[39G3400000 lines.[39G3500000 lines.[39G3600000 lines.[39G3700000 lines.[39G3800000 lines.[39G3900000 lines.[39G4000000 lines.[39G4100000 lines.[39G4200000 lines.[39G4300000 lines.[39G4400000 lines.[39G4500000 lines.[39G4600000 lines.[39G4700000 lines.[39G4800000 lines.[39G4900000 lines.[39G5000000 lines.[39G5100000 

[39G42800000 lines.[39G42900000 lines.[39G43000000 lines.[39G43100000 lines.[39G43200000 lines.[39G43300000 lines.[39G43400000 lines.[39G43500000 lines.[39G43600000 lines.[39G43700000 lines.[39G43800000 lines.[39G43900000 lines.[39G44000000 lines.[39G44100000 lines.[39G44200000 lines.[39G44300000 lines.[39G44400000 lines.[39G44500000 lines.[39G44600000 lines.[39G44700000 lines.[39G44800000 lines.[39G44900000 lines.[39G45000000 lines.[39G45100000 lines.[39G45200000 lines.[39G45300000 lines.[39G45400000 lines.[39G45500000 lines.[39G45600000 lines.[39G45700000 lines.[39G45800000 lines.[39G45900000 lines.[39G46000000 lines.[39G46100000 lines.[39G46200000 lines.[39G46300000 lines.[39G46400000 lines.[39G46500000 lines.[39G46600000 lines.[39G46700000 lines.[39G46800000 lines.[39G46900000 lines.[39G47000000 lines.[39G47100000 lines.[39G47200000 lines.[39G47300000 lines.[39G47400000 lines.[39G47500000 lines.[39G47600000 lines.[39G47700000 lines.

make: Entering directory '/home/ashutosh/study/bias_manifold/scripts'
rm -rf glove shuffle cooccur vocab_count build
make: Leaving directory '/home/ashutosh/study/bias_manifold/scripts'
make: Entering directory '/home/ashutosh/study/bias_manifold/scripts'
mkdir -p build
gcc ./glove.c -o build/glove -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic


./glove.c: In function ‘save_params’:
  249 |               if (write_header) fprintf(fout, "%ld %d\n", vocab_size, vector_size);
      |                                                ~~^        ~~~~~~~~~~
      |                                                  |        |
      |                                                  long int long long int
      |                                                %lld
./glove.c: In function ‘initialize_parameters’:
   98 |             fread(&W[a], sizeof(real), 1, fin);
      |             ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./glove.c: In function ‘glove_thread’:
  133 |         fread(&cr, sizeof(CREC), 1, fin);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~


gcc ./shuffle.c -o build/shuffle -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic
gcc ./cooccur.c -o build/cooccur -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic


./shuffle.c: In function ‘shuffle_merge’:
  107 |                 fread(&array[i], sizeof(CREC), 1, fid[j]);
      |                 ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./shuffle.c: In function ‘shuffle_by_chunks’:
  165 |         fread(&array[i], sizeof(CREC), 1, fin);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./cooccur.c: In function ‘merge_files’:
  267 |         fread(&new, sizeof(CREC), 1, fid[i]);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
  277 |     fread(&new, sizeof(CREC), 1, fid[i]);
      |     ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
  290 |         fread(&new, sizeof(CREC), 1, fid[i]);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~


gcc ./vocab_count.c -o build/vocab_count -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic
make: Leaving directory '/home/ashutosh/study/bias_manifold/scripts'


BUILDING VOCABULARY


Processed 0 tokens.[11G100000 tokens.[11G200000 tokens.[11G300000 tokens.[11G400000 tokens.[11G500000 tokens.[11G600000 tokens.[11G700000 tokens.[11G800000 tokens.[11G900000 tokens.[11G1000000 tokens.[11G1100000 tokens.[11G1200000 tokens.[11G1300000 tokens.[11G1400000 tokens.[11G1500000 tokens.[11G1600000 tokens.[11G1700000 tokens.[11G1800000 tokens.[11G1900000 tokens.[11G2000000 tokens.[11G2100000 tokens.[11G2200000 tokens.[11G2300000 tokens.[11G2400000 tokens.[11G2500000 tokens.[11G2600000 tokens.[11G2700000 tokens.[11G2800000 tokens.[11G2900000 tokens.[11G3000000 tokens.[11G3100000 tokens.[11G3200000 tokens.[11G3300000 tokens.[11G3400000 tokens.[11G3500000 tokens.[11G3600000 tokens.[11G3700000 tokens.[11G3800000 tokens.[11G3900000 tokens.[11G4000000 tokens.[11G4100000 tokens.[11G4200000 tokens.[11G4300000 tokens.[11G4400000 tokens.[11G4500000 tokens.[11G4600000 tokens.[11G4700000 tokens.[11G4800000 tokens.[11G4900000 tokens.[11G50000

[11G49100000 tokens.[11G49200000 tokens.[11G49300000 tokens.[11G49400000 tokens.[11G49500000 tokens.[11G49600000 tokens.[11G49700000 tokens.[11G49800000 tokens.[11G49900000 tokens.[11G50000000 tokens.[11G50100000 tokens.[11G50200000 tokens.[11G50300000 tokens.[11G50400000 tokens.[11G50500000 tokens.[11G50600000 tokens.[11G50700000 tokens.[11G50800000 tokens.[11G50900000 tokens.[11G51000000 tokens.[11G51100000 tokens.[11G51200000 tokens.[11G51300000 tokens.[11G51400000 tokens.[11G51500000 tokens.[11G51600000 tokens.[11G51700000 tokens.[11G51800000 tokens.[11G51900000 tokens.[0GProcessed 51945254 tokens.
Counted 467139 unique words.
Truncating vocabulary at min count 5.
Using vocabulary of size 120569.

COUNTING COOCCURRENCES
window size: 8
context: symmetric
max product: 20163704
overflow length: 57042534
Reading vocab from file "/tmp/temp.vocab"...loaded 120569 words.
Building lookup table...table contains 152731731 elements.
Processing token: 0[19G100000

Merging cooccurrence files: processed 0 lines.[39G100000 lines.[39G200000 lines.[39G300000 lines.[39G400000 lines.[39G500000 lines.[39G600000 lines.[39G700000 lines.[39G800000 lines.[39G900000 lines.[39G1000000 lines.[39G1100000 lines.[39G1200000 lines.[39G1300000 lines.[39G1400000 lines.[39G1500000 lines.[39G1600000 lines.[39G1700000 lines.[39G1800000 lines.[39G1900000 lines.[39G2000000 lines.[39G2100000 lines.[39G2200000 lines.[39G2300000 lines.[39G2400000 lines.[39G2500000 lines.[39G2600000 lines.[39G2700000 lines.[39G2800000 lines.[39G2900000 lines.[39G3000000 lines.[39G3100000 lines.[39G3200000 lines.[39G3300000 lines.[39G3400000 lines.[39G3500000 lines.[39G3600000 lines.[39G3700000 lines.[39G3800000 lines.[39G3900000 lines.[39G4000000 lines.[39G4100000 lines.[39G4200000 lines.[39G4300000 lines.[39G4400000 lines.[39G4500000 lines.[39G4600000 lines.[39G4700000 lines.[39G4800000 lines.[39G4900000 lines.[39G5000000 lines.[39G5100000 

[39G42200000 lines.[39G42300000 lines.[39G42400000 lines.[39G42500000 lines.[39G42600000 lines.[39G42700000 lines.[39G42800000 lines.[39G42900000 lines.[39G43000000 lines.[39G43100000 lines.[39G43200000 lines.[39G43300000 lines.[39G43400000 lines.[39G43500000 lines.[39G43600000 lines.[39G43700000 lines.[39G43800000 lines.[39G43900000 lines.[39G44000000 lines.[39G44100000 lines.[39G44200000 lines.[39G44300000 lines.[39G44400000 lines.[39G44500000 lines.[39G44600000 lines.[39G44700000 lines.[39G44800000 lines.[39G44900000 lines.[39G45000000 lines.[39G45100000 lines.[39G45200000 lines.[39G45300000 lines.[39G45400000 lines.[39G45500000 lines.[39G45600000 lines.[39G45700000 lines.[39G45800000 lines.[39G45900000 lines.[39G46000000 lines.[39G46100000 lines.[39G46200000 lines.[39G46300000 lines.[39G46400000 lines.[39G46500000 lines.[39G46600000 lines.[39G46700000 lines.[39G46800000 lines.[39G46900000 lines.[39G47000000 lines.[39G47100000 lines.

make: Entering directory '/home/ashutosh/study/bias_manifold/scripts'
rm -rf glove shuffle cooccur vocab_count build
make: Leaving directory '/home/ashutosh/study/bias_manifold/scripts'
make: Entering directory '/home/ashutosh/study/bias_manifold/scripts'
mkdir -p build
gcc ./glove.c -o build/glove -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic


./glove.c: In function ‘save_params’:
  249 |               if (write_header) fprintf(fout, "%ld %d\n", vocab_size, vector_size);
      |                                                ~~^        ~~~~~~~~~~
      |                                                  |        |
      |                                                  long int long long int
      |                                                %lld
./glove.c: In function ‘initialize_parameters’:
   98 |             fread(&W[a], sizeof(real), 1, fin);
      |             ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./glove.c: In function ‘glove_thread’:
  133 |         fread(&cr, sizeof(CREC), 1, fin);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./shuffle.c: In function ‘shuffle_merge’:
  107 |                 fread(&array[i], sizeof(CREC), 1, fid[j]);
      |                 ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~


gcc ./shuffle.c -o build/shuffle -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic
gcc ./cooccur.c -o build/cooccur -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic


./shuffle.c: In function ‘shuffle_by_chunks’:
  165 |         fread(&array[i], sizeof(CREC), 1, fin);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./cooccur.c: In function ‘merge_files’:
  267 |         fread(&new, sizeof(CREC), 1, fid[i]);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
  277 |     fread(&new, sizeof(CREC), 1, fid[i]);
      |     ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
  290 |         fread(&new, sizeof(CREC), 1, fid[i]);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~


gcc ./vocab_count.c -o build/vocab_count -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic
make: Leaving directory '/home/ashutosh/study/bias_manifold/scripts'


BUILDING VOCABULARY


Processed 0 tokens.[11G100000 tokens.[11G200000 tokens.[11G300000 tokens.[11G400000 tokens.[11G500000 tokens.[11G600000 tokens.[11G700000 tokens.[11G800000 tokens.[11G900000 tokens.[11G1000000 tokens.[11G1100000 tokens.[11G1200000 tokens.[11G1300000 tokens.[11G1400000 tokens.[11G1500000 tokens.[11G1600000 tokens.[11G1700000 tokens.[11G1800000 tokens.[11G1900000 tokens.[11G2000000 tokens.[11G2100000 tokens.[11G2200000 tokens.[11G2300000 tokens.[11G2400000 tokens.[11G2500000 tokens.[11G2600000 tokens.[11G2700000 tokens.[11G2800000 tokens.[11G2900000 tokens.[11G3000000 tokens.[11G3100000 tokens.[11G3200000 tokens.[11G3300000 tokens.[11G3400000 tokens.[11G3500000 tokens.[11G3600000 tokens.[11G3700000 tokens.[11G3800000 tokens.[11G3900000 tokens.[11G4000000 tokens.[11G4100000 tokens.[11G4200000 tokens.[11G4300000 tokens.[11G4400000 tokens.[11G4500000 tokens.[11G4600000 tokens.[11G4700000 tokens.[11G4800000 tokens.[11G4900000 tokens.[11G50000

[11G45800000 tokens.[11G45900000 tokens.[11G46000000 tokens.[11G46100000 tokens.[11G46200000 tokens.[11G46300000 tokens.[11G46400000 tokens.[11G46500000 tokens.[11G46600000 tokens.[11G46700000 tokens.[11G46800000 tokens.[11G46900000 tokens.[11G47000000 tokens.[11G47100000 tokens.[11G47200000 tokens.[11G47300000 tokens.[11G47400000 tokens.[11G47500000 tokens.[11G47600000 tokens.[11G47700000 tokens.[11G47800000 tokens.[11G47900000 tokens.[11G48000000 tokens.[11G48100000 tokens.[11G48200000 tokens.[11G48300000 tokens.[11G48400000 tokens.[11G48500000 tokens.[11G48600000 tokens.[11G48700000 tokens.[11G48800000 tokens.[11G48900000 tokens.[11G49000000 tokens.[11G49100000 tokens.[11G49200000 tokens.[11G49300000 tokens.[11G49400000 tokens.[11G49500000 tokens.[11G49600000 tokens.[11G49700000 tokens.[11G49800000 tokens.[11G49900000 tokens.[11G50000000 tokens.[11G50100000 tokens.[11G50200000 tokens.[11G50300000 tokens.[11G50400000 tokens.[11G50500000

Merging cooccurrence files: processed 0 lines.[39G100000 lines.[39G200000 lines.[39G300000 lines.[39G400000 lines.[39G500000 lines.[39G600000 lines.[39G700000 lines.[39G800000 lines.[39G900000 lines.[39G1000000 lines.[39G1100000 lines.[39G1200000 lines.[39G1300000 lines.[39G1400000 lines.[39G1500000 lines.[39G1600000 lines.[39G1700000 lines.[39G1800000 lines.[39G1900000 lines.[39G2000000 lines.[39G2100000 lines.[39G2200000 lines.[39G2300000 lines.[39G2400000 lines.[39G2500000 lines.[39G2600000 lines.[39G2700000 lines.[39G2800000 lines.[39G2900000 lines.[39G3000000 lines.[39G3100000 lines.[39G3200000 lines.[39G3300000 lines.[39G3400000 lines.[39G3500000 lines.[39G3600000 lines.[39G3700000 lines.[39G3800000 lines.[39G3900000 lines.[39G4000000 lines.[39G4100000 lines.[39G4200000 lines.[39G4300000 lines.[39G4400000 lines.[39G4500000 lines.[39G4600000 lines.[39G4700000 lines.[39G4800000 lines.[39G4900000 lines.[39G5000000 lines.[39G5100000 

[39G41700000 lines.[39G41800000 lines.[39G41900000 lines.[39G42000000 lines.[39G42100000 lines.[39G42200000 lines.[39G42300000 lines.[39G42400000 lines.[39G42500000 lines.[39G42600000 lines.[39G42700000 lines.[39G42800000 lines.[39G42900000 lines.[39G43000000 lines.[39G43100000 lines.[39G43200000 lines.[39G43300000 lines.[39G43400000 lines.[39G43500000 lines.[39G43600000 lines.[39G43700000 lines.[39G43800000 lines.[39G43900000 lines.[39G44000000 lines.[39G44100000 lines.[39G44200000 lines.[39G44300000 lines.[39G44400000 lines.[39G44500000 lines.[39G44600000 lines.[39G44700000 lines.[39G44800000 lines.[39G44900000 lines.[39G45000000 lines.[39G45100000 lines.[39G45200000 lines.[39G45300000 lines.[39G45400000 lines.[39G45500000 lines.[39G45600000 lines.[39G45700000 lines.[39G45800000 lines.[39G45900000 lines.[39G46000000 lines.[39G46100000 lines.[39G46200000 lines.[39G46300000 lines.[39G46400000 lines.[39G46500000 lines.[39G46600000 lines.

make: Entering directory '/home/ashutosh/study/bias_manifold/scripts'
rm -rf glove shuffle cooccur vocab_count build
make: Leaving directory '/home/ashutosh/study/bias_manifold/scripts'
make: Entering directory '/home/ashutosh/study/bias_manifold/scripts'
mkdir -p build
gcc ./glove.c -o build/glove -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic


./glove.c: In function ‘save_params’:
  249 |               if (write_header) fprintf(fout, "%ld %d\n", vocab_size, vector_size);
      |                                                ~~^        ~~~~~~~~~~
      |                                                  |        |
      |                                                  long int long long int
      |                                                %lld
./glove.c: In function ‘initialize_parameters’:
   98 |             fread(&W[a], sizeof(real), 1, fin);
      |             ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./glove.c: In function ‘glove_thread’:
  133 |         fread(&cr, sizeof(CREC), 1, fin);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~


gcc ./shuffle.c -o build/shuffle -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic
gcc ./cooccur.c -o build/cooccur -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic


./shuffle.c: In function ‘shuffle_merge’:
  107 |                 fread(&array[i], sizeof(CREC), 1, fid[j]);
      |                 ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./shuffle.c: In function ‘shuffle_by_chunks’:
  165 |         fread(&array[i], sizeof(CREC), 1, fin);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./cooccur.c: In function ‘merge_files’:
  267 |         fread(&new, sizeof(CREC), 1, fid[i]);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
  277 |     fread(&new, sizeof(CREC), 1, fid[i]);
      |     ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
  290 |         fread(&new, sizeof(CREC), 1, fid[i]);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~


gcc ./vocab_count.c -o build/vocab_count -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic
make: Leaving directory '/home/ashutosh/study/bias_manifold/scripts'


BUILDING VOCABULARY


Processed 0 tokens.[11G100000 tokens.[11G200000 tokens.[11G300000 tokens.[11G400000 tokens.[11G500000 tokens.[11G600000 tokens.[11G700000 tokens.[11G800000 tokens.[11G900000 tokens.[11G1000000 tokens.[11G1100000 tokens.[11G1200000 tokens.[11G1300000 tokens.[11G1400000 tokens.[11G1500000 tokens.[11G1600000 tokens.[11G1700000 tokens.[11G1800000 tokens.[11G1900000 tokens.[11G2000000 tokens.[11G2100000 tokens.[11G2200000 tokens.[11G2300000 tokens.[11G2400000 tokens.[11G2500000 tokens.[11G2600000 tokens.[11G2700000 tokens.[11G2800000 tokens.[11G2900000 tokens.[11G3000000 tokens.[11G3100000 tokens.[11G3200000 tokens.[11G3300000 tokens.[11G3400000 tokens.[11G3500000 tokens.[11G3600000 tokens.[11G3700000 tokens.[11G3800000 tokens.[11G3900000 tokens.[11G4000000 tokens.[11G4100000 tokens.[11G4200000 tokens.[11G4300000 tokens.[11G4400000 tokens.[11G4500000 tokens.[11G4600000 tokens.[11G4700000 tokens.[11G4800000 tokens.[11G4900000 tokens.[11G50000

[11G47300000 tokens.[11G47400000 tokens.[11G47500000 tokens.[11G47600000 tokens.[11G47700000 tokens.[11G47800000 tokens.[11G47900000 tokens.[11G48000000 tokens.[11G48100000 tokens.[11G48200000 tokens.[11G48300000 tokens.[11G48400000 tokens.[11G48500000 tokens.[11G48600000 tokens.[11G48700000 tokens.[11G48800000 tokens.[11G48900000 tokens.[11G49000000 tokens.[11G49100000 tokens.[11G49200000 tokens.[11G49300000 tokens.[11G49400000 tokens.[11G49500000 tokens.[11G49600000 tokens.[11G49700000 tokens.[11G49800000 tokens.[11G49900000 tokens.[11G50000000 tokens.[11G50100000 tokens.[11G50200000 tokens.[11G50300000 tokens.[11G50400000 tokens.[11G50500000 tokens.[11G50600000 tokens.[11G50700000 tokens.[11G50800000 tokens.[11G50900000 tokens.[11G51000000 tokens.[11G51100000 tokens.[11G51200000 tokens.[11G51300000 tokens.[11G51400000 tokens.[11G51500000 tokens.[11G51600000 tokens.[11G51700000 tokens.[11G51800000 tokens.[11G51900000 tokens.[11G52000000

Processing token: 0[19G100000[19G200000[19G300000[19G400000[19G500000[19G600000[19G700000[19G800000[19G900000[19G1000000[19G1100000[19G1200000[19G1300000[19G1400000[19G1500000[19G1600000[19G1700000[19G1800000[19G1900000[19G2000000[19G2100000[19G2200000[19G2300000[19G2400000[19G2500000[19G2600000[19G2700000[19G2800000[19G2900000[19G3000000[19G3100000[19G3200000[19G3300000[19G3400000[19G3500000[19G3600000[19G3700000[19G3800000[19G3900000[19G4000000[19G4100000[19G4200000[19G4300000[19G4400000[19G4500000[19G4600000[19G4700000[19G4800000[19G4900000[19G5000000[19G5100000[19G5200000[19G5300000[19G5400000[19G5500000[19G5600000[19G5700000[19G5800000[19G5900000[19G6000000[19G6100000[19G6200000[19G6300000[19G6400000[19G6500000[19G6600000[19G6700000[19G6800000[19G6900000[19G7000000[19G7100000[19G7200000[19G7300000[19G7400000[19G7500000[19G7600000[19G7700000[19G7800000[19G7900000[19G8000000[19G8100000[19G8200000[19G8

Merging cooccurrence files: processed 0 lines.[39G100000 lines.[39G200000 lines.[39G300000 lines.[39G400000 lines.[39G500000 lines.[39G600000 lines.[39G700000 lines.[39G800000 lines.[39G900000 lines.[39G1000000 lines.[39G1100000 lines.[39G1200000 lines.[39G1300000 lines.[39G1400000 lines.[39G1500000 lines.[39G1600000 lines.[39G1700000 lines.[39G1800000 lines.[39G1900000 lines.[39G2000000 lines.[39G2100000 lines.[39G2200000 lines.[39G2300000 lines.[39G2400000 lines.[39G2500000 lines.[39G2600000 lines.[39G2700000 lines.[39G2800000 lines.[39G2900000 lines.[39G3000000 lines.[39G3100000 lines.[39G3200000 lines.[39G3300000 lines.[39G3400000 lines.[39G3500000 lines.[39G3600000 lines.[39G3700000 lines.[39G3800000 lines.[39G3900000 lines.[39G4000000 lines.[39G4100000 lines.[39G4200000 lines.[39G4300000 lines.[39G4400000 lines.[39G4500000 lines.[39G4600000 lines.[39G4700000 lines.[39G4800000 lines.[39G4900000 lines.[39G5000000 lines.[39G5100000 

[39G41800000 lines.[39G41900000 lines.[39G42000000 lines.[39G42100000 lines.[39G42200000 lines.[39G42300000 lines.[39G42400000 lines.[39G42500000 lines.[39G42600000 lines.[39G42700000 lines.[39G42800000 lines.[39G42900000 lines.[39G43000000 lines.[39G43100000 lines.[39G43200000 lines.[39G43300000 lines.[39G43400000 lines.[39G43500000 lines.[39G43600000 lines.[39G43700000 lines.[39G43800000 lines.[39G43900000 lines.[39G44000000 lines.[39G44100000 lines.[39G44200000 lines.[39G44300000 lines.[39G44400000 lines.[39G44500000 lines.[39G44600000 lines.[39G44700000 lines.[39G44800000 lines.[39G44900000 lines.[39G45000000 lines.[39G45100000 lines.[39G45200000 lines.[39G45300000 lines.[39G45400000 lines.[39G45500000 lines.[39G45600000 lines.[39G45700000 lines.[39G45800000 lines.[39G45900000 lines.[39G46000000 lines.[39G46100000 lines.[39G46200000 lines.[39G46300000 lines.[39G46400000 lines.[39G46500000 lines.[39G46600000 lines.[39G46700000 lines.

11/18/22 - 12:57.25PM, iter: 012, cost: 0.012042
11/18/22 - 12:57.40PM, iter: 013, cost: 0.011868
11/18/22 - 12:57.56PM, iter: 014, cost: 0.011724
11/18/22 - 12:58.12PM, iter: 015, cost: 0.011592
11/18/22 - 12:58.28PM, iter: 016, cost: 0.011479
11/18/22 - 12:58.43PM, iter: 017, cost: 0.011379
11/18/22 - 12:58.59PM, iter: 018, cost: 0.011289
11/18/22 - 12:59.14PM, iter: 019, cost: 0.011207
11/18/22 - 12:59.29PM, iter: 020, cost: 0.011132
6it [35:27, 373.84s/it]

make: Entering directory '/home/ashutosh/study/bias_manifold/scripts'
rm -rf glove shuffle cooccur vocab_count build
make: Leaving directory '/home/ashutosh/study/bias_manifold/scripts'
make: Entering directory '/home/ashutosh/study/bias_manifold/scripts'
mkdir -p build
gcc ./glove.c -o build/glove -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic


./glove.c: In function ‘save_params’:
  249 |               if (write_header) fprintf(fout, "%ld %d\n", vocab_size, vector_size);
      |                                                ~~^        ~~~~~~~~~~
      |                                                  |        |
      |                                                  long int long long int
      |                                                %lld
./glove.c: In function ‘initialize_parameters’:
   98 |             fread(&W[a], sizeof(real), 1, fin);
      |             ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./glove.c: In function ‘glove_thread’:
  133 |         fread(&cr, sizeof(CREC), 1, fin);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~


gcc ./shuffle.c -o build/shuffle -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic
gcc ./cooccur.c -o build/cooccur -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic


./shuffle.c: In function ‘shuffle_merge’:
  107 |                 fread(&array[i], sizeof(CREC), 1, fid[j]);
      |                 ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./shuffle.c: In function ‘shuffle_by_chunks’:
  165 |         fread(&array[i], sizeof(CREC), 1, fin);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./cooccur.c: In function ‘merge_files’:
  267 |         fread(&new, sizeof(CREC), 1, fid[i]);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
  277 |     fread(&new, sizeof(CREC), 1, fid[i]);
      |     ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
  290 |         fread(&new, sizeof(CREC), 1, fid[i]);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~


gcc ./vocab_count.c -o build/vocab_count -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic
make: Leaving directory '/home/ashutosh/study/bias_manifold/scripts'


BUILDING VOCABULARY


Processed 0 tokens.[11G100000 tokens.[11G200000 tokens.[11G300000 tokens.[11G400000 tokens.[11G500000 tokens.[11G600000 tokens.[11G700000 tokens.[11G800000 tokens.[11G900000 tokens.[11G1000000 tokens.[11G1100000 tokens.[11G1200000 tokens.[11G1300000 tokens.[11G1400000 tokens.[11G1500000 tokens.[11G1600000 tokens.[11G1700000 tokens.[11G1800000 tokens.[11G1900000 tokens.[11G2000000 tokens.[11G2100000 tokens.[11G2200000 tokens.[11G2300000 tokens.[11G2400000 tokens.[11G2500000 tokens.[11G2600000 tokens.[11G2700000 tokens.[11G2800000 tokens.[11G2900000 tokens.[11G3000000 tokens.[11G3100000 tokens.[11G3200000 tokens.[11G3300000 tokens.[11G3400000 tokens.[11G3500000 tokens.[11G3600000 tokens.[11G3700000 tokens.[11G3800000 tokens.[11G3900000 tokens.[11G4000000 tokens.[11G4100000 tokens.[11G4200000 tokens.[11G4300000 tokens.[11G4400000 tokens.[11G4500000 tokens.[11G4600000 tokens.[11G4700000 tokens.[11G4800000 tokens.[11G4900000 tokens.[11G50000

[11G44300000 tokens.[11G44400000 tokens.[11G44500000 tokens.[11G44600000 tokens.[11G44700000 tokens.[11G44800000 tokens.[11G44900000 tokens.[11G45000000 tokens.[11G45100000 tokens.[11G45200000 tokens.[11G45300000 tokens.[11G45400000 tokens.[11G45500000 tokens.[11G45600000 tokens.[11G45700000 tokens.[11G45800000 tokens.[11G45900000 tokens.[11G46000000 tokens.[11G46100000 tokens.[11G46200000 tokens.[11G46300000 tokens.[11G46400000 tokens.[11G46500000 tokens.[11G46600000 tokens.[11G46700000 tokens.[11G46800000 tokens.[11G46900000 tokens.[11G47000000 tokens.[11G47100000 tokens.[11G47200000 tokens.[11G47300000 tokens.[11G47400000 tokens.[11G47500000 tokens.[11G47600000 tokens.[11G47700000 tokens.[11G47800000 tokens.[11G47900000 tokens.[11G48000000 tokens.[11G48100000 tokens.[11G48200000 tokens.[11G48300000 tokens.[11G48400000 tokens.[11G48500000 tokens.[11G48600000 tokens.[11G48700000 tokens.[11G48800000 tokens.[11G48900000 tokens.[11G49000000

[11G86600000 tokens.[11G86700000 tokens.[11G86800000 tokens.[11G86900000 tokens.[11G87000000 tokens.[11G87100000 tokens.[11G87200000 tokens.[11G87300000 tokens.[11G87400000 tokens.[11G87500000 tokens.[11G87600000 tokens.[11G87700000 tokens.[11G87800000 tokens.[11G87900000 tokens.[11G88000000 tokens.[11G88100000 tokens.[11G88200000 tokens.[11G88300000 tokens.[11G88400000 tokens.[11G88500000 tokens.[11G88600000 tokens.[11G88700000 tokens.[11G88800000 tokens.[11G88900000 tokens.[11G89000000 tokens.[11G89100000 tokens.[11G89200000 tokens.[11G89300000 tokens.[11G89400000 tokens.[11G89500000 tokens.[11G89600000 tokens.[11G89700000 tokens.[11G89800000 tokens.[11G89900000 tokens.[11G90000000 tokens.[11G90100000 tokens.[11G90200000 tokens.[11G90300000 tokens.[11G90400000 tokens.[11G90500000 tokens.[11G90600000 tokens.[11G90700000 tokens.[11G90800000 tokens.[11G90900000 tokens.[11G91000000 tokens.[11G91100000 tokens.[11G91200000 tokens.[11G91300000

Processing token: 0[19G100000[19G200000[19G300000[19G400000[19G500000[19G600000[19G700000[19G800000[19G900000[19G1000000[19G1100000[19G1200000[19G1300000[19G1400000[19G1500000[19G1600000[19G1700000[19G1800000[19G1900000[19G2000000[19G2100000[19G2200000[19G2300000[19G2400000[19G2500000[19G2600000[19G2700000[19G2800000[19G2900000[19G3000000[19G3100000[19G3200000[19G3300000[19G3400000[19G3500000[19G3600000[19G3700000[19G3800000[19G3900000[19G4000000[19G4100000[19G4200000[19G4300000[19G4400000[19G4500000[19G4600000[19G4700000[19G4800000[19G4900000[19G5000000[19G5100000[19G5200000[19G5300000[19G5400000[19G5500000[19G5600000[19G5700000[19G5800000[19G5900000[19G6000000[19G6100000[19G6200000[19G6300000[19G6400000[19G6500000[19G6600000[19G6700000[19G6800000[19G6900000[19G7000000[19G7100000[19G7200000[19G7300000[19G7400000[19G7500000[19G7600000[19G7700000[19G7800000[19G7900000[19G8000000[19G8100000[19G8200000[19G8

[19G64600000[19G64700000[19G64800000[19G64900000[19G65000000[19G65100000[19G65200000[19G65300000[19G65400000[19G65500000[19G65600000[19G65700000[19G65800000[19G65900000[19G66000000[19G66100000[19G66200000[19G66300000[19G66400000[19G66500000[19G66600000[19G66700000[19G66800000[19G66900000[19G67000000[19G67100000[19G67200000[19G67300000[19G67400000[19G67500000[19G67600000[19G67700000[19G67800000[19G67900000[19G68000000[19G68100000[19G68200000[19G68300000[19G68400000[19G68500000[19G68600000[19G68700000[19G68800000[19G68900000[19G69000000[19G69100000[19G69200000[19G69300000[19G69400000[19G69500000[19G69600000[19G69700000[19G69800000[19G69900000[19G70000000[19G70100000[19G70200000[19G70300000[19G70400000[19G70500000[19G70600000[19G70700000[19G70800000[19G70900000[19G71000000[19G71100000[19G71200000[19G71300000[19G71400000[19G71500000[19G71600000[19G71700000[19G71800000[19G71900000[19G72000000[19G72100000[19G7220000

Merging cooccurrence files: processed 0 lines.[39G100000 lines.[39G200000 lines.[39G300000 lines.[39G400000 lines.[39G500000 lines.[39G600000 lines.[39G700000 lines.[39G800000 lines.[39G900000 lines.[39G1000000 lines.[39G1100000 lines.[39G1200000 lines.[39G1300000 lines.[39G1400000 lines.[39G1500000 lines.[39G1600000 lines.[39G1700000 lines.[39G1800000 lines.[39G1900000 lines.[39G2000000 lines.[39G2100000 lines.[39G2200000 lines.[39G2300000 lines.[39G2400000 lines.[39G2500000 lines.[39G2600000 lines.[39G2700000 lines.[39G2800000 lines.[39G2900000 lines.[39G3000000 lines.[39G3100000 lines.[39G3200000 lines.[39G3300000 lines.[39G3400000 lines.[39G3500000 lines.[39G3600000 lines.[39G3700000 lines.[39G3800000 lines.[39G3900000 lines.[39G4000000 lines.[39G4100000 lines.[39G4200000 lines.[39G4300000 lines.[39G4400000 lines.[39G4500000 lines.[39G4600000 lines.[39G4700000 lines.[39G4800000 lines.[39G4900000 lines.[39G5000000 lines.[39G5100000 

[39G43100000 lines.[39G43200000 lines.[39G43300000 lines.[39G43400000 lines.[39G43500000 lines.[39G43600000 lines.[39G43700000 lines.[39G43800000 lines.[39G43900000 lines.[39G44000000 lines.[39G44100000 lines.[39G44200000 lines.[39G44300000 lines.[39G44400000 lines.[39G44500000 lines.[39G44500000 lines.[39G44600000 lines.[39G44700000 lines.[39G44800000 lines.[39G44800000 lines.[39G44900000 lines.[39G45000000 lines.[39G45100000 lines.[39G45200000 lines.[39G45300000 lines.[39G45400000 lines.[39G45500000 lines.[39G45600000 lines.[39G45700000 lines.[39G45800000 lines.[39G45900000 lines.[39G46000000 lines.[39G46100000 lines.[39G46200000 lines.[39G46300000 lines.[39G46400000 lines.[39G46500000 lines.[39G46600000 lines.[39G46700000 lines.[39G46700000 lines.[39G46800000 lines.[39G46900000 lines.[39G47000000 lines.[39G47100000 lines.[39G47200000 lines.[39G47300000 lines.[39G47400000 lines.[39G47500000 lines.[39G47600000 lines.[39G47700000 lines.

[39G86100000 lines.[39G86200000 lines.[39G86300000 lines.[39G86400000 lines.[39G86500000 lines.[39G86600000 lines.[39G86700000 lines.[39G86800000 lines.[39G86900000 lines.[39G86900000 lines.[39G87000000 lines.[39G87100000 lines.[39G87200000 lines.[39G87300000 lines.[39G87400000 lines.[39G87500000 lines.[39G87600000 lines.[39G87700000 lines.[39G87800000 lines.[39G87900000 lines.[39G88000000 lines.[39G88100000 lines.[39G88200000 lines.[39G88300000 lines.[39G88400000 lines.[39G88500000 lines.[39G88600000 lines.[39G88700000 lines.[39G88800000 lines.[39G88900000 lines.[39G89000000 lines.[39G89100000 lines.[39G89200000 lines.[39G89300000 lines.[39G89400000 lines.[39G89500000 lines.[39G89600000 lines.[39G89700000 lines.[39G89800000 lines.[39G89900000 lines.[39G90000000 lines.[39G90100000 lines.[39G90200000 lines.[39G90300000 lines.[39G90400000 lines.[39G90500000 lines.[39G90600000 lines.[39G90700000 lines.[39G90800000 lines.[39G90900000 lines.

make: Entering directory '/home/ashutosh/study/bias_manifold/scripts'
rm -rf glove shuffle cooccur vocab_count build
make: Leaving directory '/home/ashutosh/study/bias_manifold/scripts'
make: Entering directory '/home/ashutosh/study/bias_manifold/scripts'
mkdir -p build
gcc ./glove.c -o build/glove -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic


./glove.c: In function ‘save_params’:
  249 |               if (write_header) fprintf(fout, "%ld %d\n", vocab_size, vector_size);
      |                                                ~~^        ~~~~~~~~~~
      |                                                  |        |
      |                                                  long int long long int
      |                                                %lld
./glove.c: In function ‘initialize_parameters’:
   98 |             fread(&W[a], sizeof(real), 1, fin);
      |             ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./glove.c: In function ‘glove_thread’:
  133 |         fread(&cr, sizeof(CREC), 1, fin);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~


gcc ./shuffle.c -o build/shuffle -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic
gcc ./cooccur.c -o build/cooccur -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic


./shuffle.c: In function ‘shuffle_merge’:
  107 |                 fread(&array[i], sizeof(CREC), 1, fid[j]);
      |                 ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./shuffle.c: In function ‘shuffle_by_chunks’:
  165 |         fread(&array[i], sizeof(CREC), 1, fin);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./cooccur.c: In function ‘merge_files’:
  267 |         fread(&new, sizeof(CREC), 1, fid[i]);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
  277 |     fread(&new, sizeof(CREC), 1, fid[i]);
      |     ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
  290 |         fread(&new, sizeof(CREC), 1, fid[i]);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~


gcc ./vocab_count.c -o build/vocab_count -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic
make: Leaving directory '/home/ashutosh/study/bias_manifold/scripts'


BUILDING VOCABULARY


Processed 0 tokens.[11G100000 tokens.[11G200000 tokens.[11G300000 tokens.[11G400000 tokens.[11G500000 tokens.[11G600000 tokens.[11G700000 tokens.[11G800000 tokens.[11G900000 tokens.[11G1000000 tokens.[11G1100000 tokens.[11G1200000 tokens.[11G1300000 tokens.[11G1400000 tokens.[11G1500000 tokens.[11G1600000 tokens.[11G1700000 tokens.[11G1800000 tokens.[11G1900000 tokens.[11G2000000 tokens.[11G2100000 tokens.[11G2200000 tokens.[11G2300000 tokens.[11G2400000 tokens.[11G2500000 tokens.[11G2600000 tokens.[11G2700000 tokens.[11G2800000 tokens.[11G2900000 tokens.[11G3000000 tokens.[11G3100000 tokens.[11G3200000 tokens.[11G3300000 tokens.[11G3400000 tokens.[11G3500000 tokens.[11G3600000 tokens.[11G3700000 tokens.[11G3800000 tokens.[11G3900000 tokens.[11G4000000 tokens.[11G4100000 tokens.[11G4200000 tokens.[11G4300000 tokens.[11G4400000 tokens.[11G4500000 tokens.[11G4600000 tokens.[11G4700000 tokens.[11G4800000 tokens.[11G4900000 tokens.[11G50000

[11G47100000 tokens.[11G47200000 tokens.[11G47300000 tokens.[11G47400000 tokens.[11G47500000 tokens.[11G47600000 tokens.[11G47700000 tokens.[11G47800000 tokens.[11G47900000 tokens.[11G48000000 tokens.[11G48100000 tokens.[11G48200000 tokens.[11G48300000 tokens.[11G48400000 tokens.[11G48500000 tokens.[11G48600000 tokens.[11G48700000 tokens.[11G48800000 tokens.[11G48900000 tokens.[11G49000000 tokens.[11G49100000 tokens.[11G49200000 tokens.[11G49300000 tokens.[11G49400000 tokens.[11G49500000 tokens.[11G49600000 tokens.[11G49700000 tokens.[11G49800000 tokens.[11G49900000 tokens.[11G50000000 tokens.[11G50100000 tokens.[11G50200000 tokens.[11G50300000 tokens.[11G50400000 tokens.[11G50500000 tokens.[11G50600000 tokens.[11G50700000 tokens.[11G50800000 tokens.[11G50900000 tokens.[11G51000000 tokens.[11G51100000 tokens.[11G51200000 tokens.[11G51300000 tokens.[11G51400000 tokens.[11G51500000 tokens.[11G51600000 tokens.[11G51700000 tokens.[11G51800000

[11G88800000 tokens.[11G88900000 tokens.[11G89000000 tokens.[11G89100000 tokens.[11G89200000 tokens.[11G89300000 tokens.[11G89400000 tokens.[11G89500000 tokens.[11G89600000 tokens.[11G89700000 tokens.[11G89800000 tokens.[11G89900000 tokens.[11G90000000 tokens.[11G90100000 tokens.[11G90200000 tokens.[11G90300000 tokens.[11G90400000 tokens.[11G90500000 tokens.[11G90600000 tokens.[11G90700000 tokens.[11G90800000 tokens.[11G90900000 tokens.[11G91000000 tokens.[11G91100000 tokens.[11G91200000 tokens.[11G91300000 tokens.[11G91400000 tokens.[11G91500000 tokens.[11G91600000 tokens.[11G91700000 tokens.[11G91800000 tokens.[11G91900000 tokens.[11G92000000 tokens.[11G92100000 tokens.[11G92200000 tokens.[11G92300000 tokens.[11G92400000 tokens.[11G92500000 tokens.[11G92600000 tokens.[11G92700000 tokens.[11G92800000 tokens.[11G92900000 tokens.[11G93000000 tokens.[11G93100000 tokens.[11G93200000 tokens.[11G93300000 tokens.[11G93400000 tokens.[11G93500000

Processing token: 0[19G100000[19G200000[19G300000[19G400000[19G500000[19G600000[19G700000[19G800000[19G900000[19G1000000[19G1100000[19G1200000[19G1300000[19G1400000[19G1500000[19G1600000[19G1700000[19G1800000[19G1900000[19G2000000[19G2100000[19G2200000[19G2300000[19G2400000[19G2500000[19G2600000[19G2700000[19G2800000[19G2900000[19G3000000[19G3100000[19G3200000[19G3300000[19G3400000[19G3500000[19G3600000[19G3700000[19G3800000[19G3900000[19G4000000[19G4100000[19G4200000[19G4300000[19G4400000[19G4500000[19G4600000[19G4700000[19G4800000[19G4900000[19G5000000[19G5100000[19G5200000[19G5300000[19G5400000[19G5500000[19G5600000[19G5700000[19G5800000[19G5900000[19G6000000[19G6100000[19G6200000[19G6300000[19G6400000[19G6500000[19G6600000[19G6700000[19G6800000[19G6900000[19G7000000[19G7100000[19G7200000[19G7300000[19G7400000[19G7500000[19G7600000[19G7700000[19G7800000[19G7900000[19G8000000[19G8100000[19G8200000[19G8

[19G64600000[19G64700000[19G64800000[19G64900000[19G65000000[19G65100000[19G65200000[19G65300000[19G65400000[19G65500000[19G65600000[19G65700000[19G65800000[19G65900000[19G66000000[19G66100000[19G66200000[19G66300000[19G66400000[19G66500000[19G66600000[19G66700000[19G66800000[19G66900000[19G67000000[19G67100000[19G67200000[19G67300000[19G67400000[19G67500000[19G67600000[19G67700000[19G67800000[19G67900000[19G68000000[19G68100000[19G68200000[19G68300000[19G68400000[19G68500000[19G68600000[19G68700000[19G68800000[19G68900000[19G69000000[19G69100000[19G69200000[19G69300000[19G69400000[19G69500000[19G69600000[19G69700000[19G69800000[19G69900000[19G70000000[19G70100000[19G70200000[19G70300000[19G70400000[19G70500000[19G70600000[19G70700000[19G70800000[19G70900000[19G71000000[19G71100000[19G71200000[19G71300000[19G71400000[19G71500000[19G71600000[19G71700000[19G71800000[19G71900000[19G72000000[19G72100000[19G7220000

Merging cooccurrence files: processed 0 lines.[39G100000 lines.[39G200000 lines.[39G300000 lines.[39G400000 lines.[39G500000 lines.[39G600000 lines.[39G700000 lines.[39G800000 lines.[39G900000 lines.[39G1000000 lines.[39G1100000 lines.[39G1200000 lines.[39G1300000 lines.[39G1400000 lines.[39G1500000 lines.[39G1600000 lines.[39G1700000 lines.[39G1800000 lines.[39G1900000 lines.[39G2000000 lines.[39G2100000 lines.[39G2200000 lines.[39G2300000 lines.[39G2400000 lines.[39G2500000 lines.[39G2600000 lines.[39G2700000 lines.[39G2800000 lines.[39G2900000 lines.[39G3000000 lines.[39G3100000 lines.[39G3200000 lines.[39G3300000 lines.[39G3400000 lines.[39G3500000 lines.[39G3600000 lines.[39G3700000 lines.[39G3800000 lines.[39G3900000 lines.[39G4000000 lines.[39G4100000 lines.[39G4200000 lines.[39G4300000 lines.[39G4400000 lines.[39G4500000 lines.[39G4600000 lines.[39G4700000 lines.[39G4800000 lines.[39G4900000 lines.[39G5000000 lines.[39G5100000 

[39G40300000 lines.[39G40400000 lines.[39G40500000 lines.[39G40600000 lines.[39G40700000 lines.[39G40800000 lines.[39G40900000 lines.[39G41000000 lines.[39G41100000 lines.[39G41200000 lines.[39G41300000 lines.[39G41400000 lines.[39G41500000 lines.[39G41600000 lines.[39G41700000 lines.[39G41800000 lines.[39G41900000 lines.[39G42000000 lines.[39G42100000 lines.[39G42100000 lines.[39G42100000 lines.[39G42200000 lines.[39G42300000 lines.[39G42400000 lines.[39G42400000 lines.[39G42500000 lines.[39G42600000 lines.[39G42700000 lines.[39G42800000 lines.[39G42900000 lines.[39G43000000 lines.[39G43100000 lines.[39G43200000 lines.[39G43300000 lines.[39G43400000 lines.[39G43500000 lines.[39G43600000 lines.[39G43700000 lines.[39G43800000 lines.[39G43900000 lines.[39G44000000 lines.[39G44100000 lines.[39G44200000 lines.[39G44300000 lines.[39G44400000 lines.[39G44500000 lines.[39G44600000 lines.[39G44700000 lines.[39G44800000 lines.[39G44800000 lines.

[39G80700000 lines.[39G80800000 lines.[39G80900000 lines.[39G81000000 lines.[39G81100000 lines.[39G81200000 lines.[39G81300000 lines.[39G81400000 lines.[39G81500000 lines.[39G81600000 lines.[39G81700000 lines.[39G81800000 lines.[39G81900000 lines.[39G82000000 lines.[39G82100000 lines.[39G82200000 lines.[39G82300000 lines.[39G82400000 lines.[39G82500000 lines.[39G82600000 lines.[39G82700000 lines.[39G82700000 lines.[39G82800000 lines.[39G82900000 lines.[39G83000000 lines.[39G83000000 lines.[39G83100000 lines.[39G83200000 lines.[39G83300000 lines.[39G83400000 lines.[39G83500000 lines.[39G83600000 lines.[39G83700000 lines.[39G83800000 lines.[39G83900000 lines.[39G84000000 lines.[39G84000000 lines.[39G84100000 lines.[39G84200000 lines.[39G84300000 lines.[39G84400000 lines.[39G84500000 lines.[39G84600000 lines.[39G84700000 lines.[39G84800000 lines.[39G84900000 lines.[39G85000000 lines.[39G85100000 lines.[39G85100000 lines.[39G85200000 lines.

[39G121300000 lines.[39G121400000 lines.[39G121500000 lines.[39G121600000 lines.[39G121700000 lines.[39G121800000 lines.[39G121900000 lines.[39G122000000 lines.[39G122100000 lines.[39G122200000 lines.[39G122300000 lines.[39G122400000 lines.[39G122500000 lines.[39G122600000 lines.[39G122700000 lines.[39G122800000 lines.[39G122900000 lines.[39G123000000 lines.[39G123100000 lines.[39G123200000 lines.[0GMerging cooccurrence files: processed 123256244 lines.

SHUFFLING COOCCURRENCES
array size: 382520524
Shuffling by chunks: processed 0 lines.[22Gprocessed 123256244 lines.
Wrote 1 temporary file(s).
Merging temp files: processed 0 lines.[31G123256244 lines.[0GMerging temp files: processed 123256244 lines.

TRAINING MODEL
Read 123256244 lines.
Initializing parameters... done.
vector size: 100
vocab size: 212059
x_max: 100.000000
alpha: 0.750000
11/18/22 - 01:14.16PM, iter: 001, cost: 0.033477
11/18/22 - 01:14.46PM, iter: 002, cost: 0.023351
11/18/22 - 01:15.14PM, iter

make: Entering directory '/home/ashutosh/study/bias_manifold/scripts'
rm -rf glove shuffle cooccur vocab_count build
make: Leaving directory '/home/ashutosh/study/bias_manifold/scripts'
make: Entering directory '/home/ashutosh/study/bias_manifold/scripts'
mkdir -p build
gcc ./glove.c -o build/glove -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic


./glove.c: In function ‘save_params’:
  249 |               if (write_header) fprintf(fout, "%ld %d\n", vocab_size, vector_size);
      |                                                ~~^        ~~~~~~~~~~
      |                                                  |        |
      |                                                  long int long long int
      |                                                %lld
./glove.c: In function ‘initialize_parameters’:
   98 |             fread(&W[a], sizeof(real), 1, fin);
      |             ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./glove.c: In function ‘glove_thread’:
  133 |         fread(&cr, sizeof(CREC), 1, fin);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~


gcc ./shuffle.c -o build/shuffle -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic
gcc ./cooccur.c -o build/cooccur -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic


./shuffle.c: In function ‘shuffle_merge’:
  107 |                 fread(&array[i], sizeof(CREC), 1, fid[j]);
      |                 ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./shuffle.c: In function ‘shuffle_by_chunks’:
  165 |         fread(&array[i], sizeof(CREC), 1, fin);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./cooccur.c: In function ‘merge_files’:
  267 |         fread(&new, sizeof(CREC), 1, fid[i]);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
  277 |     fread(&new, sizeof(CREC), 1, fid[i]);
      |     ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
  290 |         fread(&new, sizeof(CREC), 1, fid[i]);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~


gcc ./vocab_count.c -o build/vocab_count -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic
make: Leaving directory '/home/ashutosh/study/bias_manifold/scripts'


BUILDING VOCABULARY


Processed 0 tokens.[11G100000 tokens.[11G200000 tokens.[11G300000 tokens.[11G400000 tokens.[11G500000 tokens.[11G600000 tokens.[11G700000 tokens.[11G800000 tokens.[11G900000 tokens.[11G1000000 tokens.[11G1100000 tokens.[11G1200000 tokens.[11G1300000 tokens.[11G1400000 tokens.[11G1500000 tokens.[11G1600000 tokens.[11G1700000 tokens.[11G1800000 tokens.[11G1900000 tokens.[11G2000000 tokens.[11G2100000 tokens.[11G2200000 tokens.[11G2300000 tokens.[11G2400000 tokens.[11G2500000 tokens.[11G2600000 tokens.[11G2700000 tokens.[11G2800000 tokens.[11G2900000 tokens.[11G3000000 tokens.[11G3100000 tokens.[11G3200000 tokens.[11G3300000 tokens.[11G3400000 tokens.[11G3500000 tokens.[11G3600000 tokens.[11G3700000 tokens.[11G3800000 tokens.[11G3900000 tokens.[11G4000000 tokens.[11G4100000 tokens.[11G4200000 tokens.[11G4300000 tokens.[11G4400000 tokens.[11G4500000 tokens.[11G4600000 tokens.[11G4700000 tokens.[11G4800000 tokens.[11G4900000 tokens.[11G50000

[11G48200000 tokens.[11G48300000 tokens.[11G48400000 tokens.[11G48500000 tokens.[11G48600000 tokens.[11G48700000 tokens.[11G48800000 tokens.[11G48900000 tokens.[11G49000000 tokens.[11G49100000 tokens.[11G49200000 tokens.[11G49300000 tokens.[11G49400000 tokens.[11G49500000 tokens.[11G49600000 tokens.[11G49700000 tokens.[11G49800000 tokens.[11G49900000 tokens.[11G50000000 tokens.[11G50100000 tokens.[11G50200000 tokens.[11G50300000 tokens.[11G50400000 tokens.[11G50500000 tokens.[11G50600000 tokens.[11G50700000 tokens.[11G50800000 tokens.[11G50900000 tokens.[11G51000000 tokens.[11G51100000 tokens.[11G51200000 tokens.[11G51300000 tokens.[11G51400000 tokens.[11G51500000 tokens.[11G51600000 tokens.[11G51700000 tokens.[11G51800000 tokens.[11G51900000 tokens.[11G52000000 tokens.[11G52100000 tokens.[11G52200000 tokens.[11G52300000 tokens.[11G52400000 tokens.[11G52500000 tokens.[11G52600000 tokens.[11G52700000 tokens.[11G52800000 tokens.[11G52900000

[11G87300000 tokens.[11G87400000 tokens.[11G87500000 tokens.[11G87600000 tokens.[11G87700000 tokens.[11G87800000 tokens.[11G87900000 tokens.[11G88000000 tokens.[11G88100000 tokens.[11G88200000 tokens.[11G88300000 tokens.[11G88400000 tokens.[11G88500000 tokens.[11G88600000 tokens.[11G88700000 tokens.[11G88800000 tokens.[11G88900000 tokens.[11G89000000 tokens.[11G89100000 tokens.[11G89200000 tokens.[11G89300000 tokens.[11G89400000 tokens.[11G89500000 tokens.[11G89600000 tokens.[11G89700000 tokens.[11G89800000 tokens.[11G89900000 tokens.[11G90000000 tokens.[11G90100000 tokens.[11G90200000 tokens.[11G90300000 tokens.[11G90400000 tokens.[11G90500000 tokens.[11G90600000 tokens.[11G90700000 tokens.[11G90800000 tokens.[11G90900000 tokens.[11G91000000 tokens.[11G91100000 tokens.[11G91200000 tokens.[11G91300000 tokens.[11G91400000 tokens.[11G91500000 tokens.[11G91600000 tokens.[11G91700000 tokens.[11G91800000 tokens.[11G91900000 tokens.[11G92000000

Processing token: 0[19G100000[19G200000[19G300000[19G400000[19G500000[19G600000[19G700000[19G800000[19G900000[19G1000000[19G1100000[19G1200000[19G1300000[19G1400000[19G1500000[19G1600000[19G1700000[19G1800000[19G1900000[19G2000000[19G2100000[19G2200000[19G2300000[19G2400000[19G2500000[19G2600000[19G2700000[19G2800000[19G2900000[19G3000000[19G3100000[19G3200000[19G3300000[19G3400000[19G3500000[19G3600000[19G3700000[19G3800000[19G3900000[19G4000000[19G4100000[19G4200000[19G4300000[19G4400000[19G4500000[19G4600000[19G4700000[19G4800000[19G4900000[19G5000000[19G5100000[19G5200000[19G5300000[19G5400000[19G5500000[19G5600000[19G5700000[19G5800000[19G5900000[19G6000000[19G6100000[19G6200000[19G6300000[19G6400000[19G6500000[19G6600000[19G6700000[19G6800000[19G6900000[19G7000000[19G7100000[19G7200000[19G7300000[19G7400000[19G7500000[19G7600000[19G7700000[19G7800000[19G7900000[19G8000000[19G8100000[19G8200000[19G8

[19G64700000[19G64800000[19G64900000[19G65000000[19G65100000[19G65200000[19G65300000[19G65400000[19G65500000[19G65600000[19G65700000[19G65800000[19G65900000[19G66000000[19G66100000[19G66200000[19G66300000[19G66400000[19G66500000[19G66600000[19G66700000[19G66800000[19G66900000[19G67000000[19G67100000[19G67200000[19G67300000[19G67400000[19G67500000[19G67600000[19G67700000[19G67800000[19G67900000[19G68000000[19G68100000[19G68200000[19G68300000[19G68400000[19G68500000[19G68600000[19G68700000[19G68800000[19G68900000[19G69000000[19G69100000[19G69200000[19G69300000[19G69400000[19G69500000[19G69600000[19G69700000[19G69800000[19G69900000[19G70000000[19G70100000[19G70200000[19G70300000[19G70400000[19G70500000[19G70600000[19G70700000[19G70800000[19G70900000[19G71000000[19G71100000[19G71200000[19G71300000[19G71400000[19G71500000[19G71600000[19G71700000[19G71800000[19G71900000[19G72000000[19G72100000[19G72200000[19G7230000

Merging cooccurrence files: processed 0 lines.[39G100000 lines.[39G200000 lines.[39G300000 lines.[39G400000 lines.[39G500000 lines.[39G600000 lines.[39G700000 lines.[39G800000 lines.[39G900000 lines.[39G1000000 lines.[39G1100000 lines.[39G1200000 lines.[39G1300000 lines.[39G1400000 lines.[39G1500000 lines.[39G1600000 lines.[39G1700000 lines.[39G1800000 lines.[39G1900000 lines.[39G2000000 lines.[39G2100000 lines.[39G2200000 lines.[39G2300000 lines.[39G2400000 lines.[39G2500000 lines.[39G2600000 lines.[39G2700000 lines.[39G2800000 lines.[39G2900000 lines.[39G3000000 lines.[39G3100000 lines.[39G3200000 lines.[39G3300000 lines.[39G3400000 lines.[39G3500000 lines.[39G3600000 lines.[39G3700000 lines.[39G3800000 lines.[39G3900000 lines.[39G4000000 lines.[39G4100000 lines.[39G4200000 lines.[39G4300000 lines.[39G4400000 lines.[39G4500000 lines.[39G4600000 lines.[39G4700000 lines.[39G4800000 lines.[39G4900000 lines.[39G5000000 lines.[39G5100000 

[39G40700000 lines.[39G40800000 lines.[39G40900000 lines.[39G41000000 lines.[39G41100000 lines.[39G41200000 lines.[39G41300000 lines.[39G41400000 lines.[39G41500000 lines.[39G41600000 lines.[39G41700000 lines.[39G41800000 lines.[39G41900000 lines.[39G42000000 lines.[39G42100000 lines.[39G42200000 lines.[39G42300000 lines.[39G42400000 lines.[39G42500000 lines.[39G42600000 lines.[39G42700000 lines.[39G42800000 lines.[39G42900000 lines.[39G43000000 lines.[39G43100000 lines.[39G43200000 lines.[39G43300000 lines.[39G43400000 lines.[39G43500000 lines.[39G43600000 lines.[39G43700000 lines.[39G43800000 lines.[39G43900000 lines.[39G44000000 lines.[39G44100000 lines.[39G44200000 lines.[39G44300000 lines.[39G44400000 lines.[39G44500000 lines.[39G44600000 lines.[39G44700000 lines.[39G44800000 lines.[39G44900000 lines.[39G45000000 lines.[39G45100000 lines.[39G45200000 lines.[39G45300000 lines.[39G45400000 lines.[39G45500000 lines.[39G45600000 lines.

[39G83100000 lines.[39G83200000 lines.[39G83300000 lines.[39G83400000 lines.[39G83500000 lines.[39G83600000 lines.[39G83700000 lines.[39G83800000 lines.[39G83900000 lines.[39G84000000 lines.[39G84100000 lines.[39G84200000 lines.[39G84300000 lines.[39G84400000 lines.[39G84500000 lines.[39G84600000 lines.[39G84700000 lines.[39G84800000 lines.[39G84900000 lines.[39G85000000 lines.[39G85100000 lines.[39G85200000 lines.[39G85300000 lines.[39G85400000 lines.[39G85500000 lines.[39G85600000 lines.[39G85700000 lines.[39G85800000 lines.[39G85900000 lines.[39G86000000 lines.[39G86100000 lines.[39G86200000 lines.[39G86300000 lines.[39G86400000 lines.[39G86500000 lines.[39G86600000 lines.[39G86700000 lines.[39G86800000 lines.[39G86900000 lines.[39G87000000 lines.[39G87100000 lines.[39G87200000 lines.[39G87300000 lines.[39G87400000 lines.[39G87500000 lines.[39G87600000 lines.[39G87700000 lines.[39G87800000 lines.[39G87900000 lines.[39G88000000 lines.

make: Entering directory '/home/ashutosh/study/bias_manifold/scripts'
rm -rf glove shuffle cooccur vocab_count build
make: Leaving directory '/home/ashutosh/study/bias_manifold/scripts'
make: Entering directory '/home/ashutosh/study/bias_manifold/scripts'
mkdir -p build
gcc ./glove.c -o build/glove -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic


./glove.c: In function ‘save_params’:
  249 |               if (write_header) fprintf(fout, "%ld %d\n", vocab_size, vector_size);
      |                                                ~~^        ~~~~~~~~~~
      |                                                  |        |
      |                                                  long int long long int
      |                                                %lld
./glove.c: In function ‘initialize_parameters’:
   98 |             fread(&W[a], sizeof(real), 1, fin);
      |             ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./glove.c: In function ‘glove_thread’:
  133 |         fread(&cr, sizeof(CREC), 1, fin);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~


gcc ./shuffle.c -o build/shuffle -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic
gcc ./cooccur.c -o build/cooccur -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic


./shuffle.c: In function ‘shuffle_merge’:
  107 |                 fread(&array[i], sizeof(CREC), 1, fid[j]);
      |                 ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./shuffle.c: In function ‘shuffle_by_chunks’:
  165 |         fread(&array[i], sizeof(CREC), 1, fin);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
./cooccur.c: In function ‘merge_files’:
  267 |         fread(&new, sizeof(CREC), 1, fid[i]);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
  277 |     fread(&new, sizeof(CREC), 1, fid[i]);
      |     ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
  290 |         fread(&new, sizeof(CREC), 1, fid[i]);
      |         ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~


gcc ./vocab_count.c -o build/vocab_count -lm -pthread -Ofast -march=native -funroll-loops -Wall -Wextra -Wpedantic
make: Leaving directory '/home/ashutosh/study/bias_manifold/scripts'


BUILDING VOCABULARY
Processed 0 tokens.[11G100000 tokens.[11G200000 tokens.[11G300000 tokens.[11G400000 tokens.[11G500000 tokens.[11G600000 tokens.[11G700000 tokens.[11G800000 tokens.[11G900000 tokens.[11G1000000 tokens.[11G1100000 tokens.[11G1200000 tokens.[11G1300000 tokens.[11G1400000 tokens.[11G1500000 tokens.[11G1600000 tokens.[11G1700000 tokens.[11G1800000 tokens.[11G1900000 tokens.[11G2000000 tokens.[11G2100000 tokens.[11G2200000 tokens.[11G2300000 tokens.[11G2400000 tokens.[11G2500000 tokens.[11G2600000 tokens.[11G2700000 tokens.[11G2800000 tokens.[11G2900000 tokens.[11G3000000 tokens.[11G3100000 tokens.[11G3200000 tokens.[11G3300000 tokens.[11G3400000 tokens.[11G3500000 tokens.[11G3600000 tokens.[11G3700000 tokens.[11G3800000 tokens.[11G3900000 tokens.[11G4000000 tokens.[11G4100000 tokens.[11G4200000 tokens.[11G4300000 tokens.[11G4400000 tokens.[11G4500000 tokens.[11G4600000 tokens.[11G4700000 tokens.[11G4800000 tokens.[11G49000

Processing token: 0[19G100000[19G200000[19G300000[19G400000[19G500000[19G600000[19G700000[19G800000[19G900000[19G1000000[19G1100000[19G1200000[19G1300000[19G1400000[19G1500000[19G1600000[19G1700000[19G1800000[19G1900000[19G2000000[19G2100000[19G2200000[19G2300000[19G2400000[19G2500000[19G2600000[19G2700000[19G2800000[19G2900000[19G3000000[19G3100000[19G3200000[19G3300000[19G3400000[19G3500000[19G3600000[19G3700000[19G3800000[19G3900000[19G4000000[19G4100000[19G4200000[19G4300000[19G4400000[19G4500000[19G4600000[19G4700000[19G4800000[19G4900000[19G5000000[19G5100000[19G5200000[19G5300000[19G5400000[19G5500000[19G5600000[19G5700000[19G5800000[19G5900000[19G6000000[19G6100000[19G6200000[19G6300000[19G6400000[19G6500000[19G6600000[19G6700000[19G6800000[19G6900000[19G7000000[19G7100000[19G7200000[19G7300000[19G7400000[19G7500000[19G7600000[19G7700000[19G7800000[19G7900000[19G8000000[19G8100000[19G8200000[19G8

Merging cooccurrence files: processed 0 lines.[39G100000 lines.[39G200000 lines.[39G300000 lines.[39G400000 lines.[39G500000 lines.[39G600000 lines.[39G700000 lines.[39G800000 lines.[39G900000 lines.[39G1000000 lines.[39G1100000 lines.[39G1200000 lines.[39G1300000 lines.[39G1400000 lines.[39G1500000 lines.[39G1600000 lines.[39G1700000 lines.[39G1800000 lines.[39G1900000 lines.[39G2000000 lines.[39G2100000 lines.[39G2200000 lines.[39G2300000 lines.[39G2400000 lines.[39G2500000 lines.[39G2600000 lines.[39G2700000 lines.[39G2800000 lines.[39G2900000 lines.[39G3000000 lines.[39G3100000 lines.[39G3200000 lines.[39G3300000 lines.[39G3400000 lines.[39G3500000 lines.[39G3600000 lines.[39G3700000 lines.[39G3800000 lines.[39G3900000 lines.[39G4000000 lines.[39G4100000 lines.[39G4200000 lines.[39G4300000 lines.[39G4400000 lines.[39G4500000 lines.[39G4600000 lines.[39G4700000 lines.[39G4800000 lines.[39G4900000 lines.[39G5000000 lines.[39G5100000 

[39G41800000 lines.[39G41900000 lines.[39G42000000 lines.[39G42100000 lines.[39G42200000 lines.[39G42300000 lines.[39G42400000 lines.[39G42500000 lines.[39G42600000 lines.[39G42700000 lines.[39G42800000 lines.[39G42900000 lines.[39G43000000 lines.[39G43100000 lines.[39G43200000 lines.[39G43300000 lines.[39G43400000 lines.[39G43500000 lines.[39G43600000 lines.[39G43700000 lines.[39G43800000 lines.[39G43900000 lines.[39G44000000 lines.[39G44100000 lines.[39G44200000 lines.[39G44300000 lines.[39G44400000 lines.[39G44500000 lines.[39G44600000 lines.[39G44700000 lines.[39G44800000 lines.[39G44900000 lines.[39G45000000 lines.[39G45100000 lines.[39G45200000 lines.[39G45300000 lines.[39G45400000 lines.[39G45500000 lines.[39G45600000 lines.[39G45700000 lines.[39G45800000 lines.[39G45900000 lines.[39G46000000 lines.[39G46100000 lines.[39G46200000 lines.[39G46300000 lines.[39G46400000 lines.[39G46500000 lines.[39G46600000 lines.[39G46700000 lines.