In [1]:
from simulations.local_chi2_cpm import get_all_pairwise_pearson_categorical_divergences_and_p_values
import time
import datetime
import numpy as np
from pathlib import Path

In [2]:
# Three base abundance levels; each one is scaled by 1, 2 and 5, and every
# scaled value is repeated 10 times, giving 3 * 3 * 10 = 90 entries.
base_relative_abundances = [1e-4, 1e-3, 1e-2]

relative_abundances = [
    base_level * multiplier
    for base_level in base_relative_abundances
    for multiplier in (1, 2, 5)
    for _ in range(10)
]

# A final entry takes whatever mass is left over, so the vector sums to 1.
relative_abundances.append(1 - sum(relative_abundances))
frequencies = np.array(relative_abundances)

# Passed as the `rate` keyword to the pairwise test below.
# NOTE(review): its exact meaning is defined by the simulations package — confirm there.
rate = 2

In [3]:
# Read the array stored under the 'droplets' key of the results archive.
# np.load() on an .npz returns a lazy NpzFile that keeps the underlying file
# open; the context manager closes it once the array has been read into
# memory, so the file handle is not leaked for the lifetime of the kernel.
with np.load('CPIDM_results.npz') as npzfile:
    droplets = npzfile['droplets']

In [4]:
results_filename = 'pairwise_results.npz'
results_file = Path(results_filename)

# Create the output directory up front: if the destination cannot be created,
# fail now rather than after the timed computation has already finished.
results_file.parent.mkdir(parents=True, exist_ok=True)

# perf_counter() is a monotonic clock intended for measuring intervals; unlike
# time.time() it cannot jump if the system clock is adjusted during the run.
start_time = time.perf_counter()
divergences, pvals, sign_vectors = get_all_pairwise_pearson_categorical_divergences_and_p_values(
    droplets, frequencies, rate=rate, signs=True)
runtime = time.perf_counter() - start_time

# Append (never overwrite) the elapsed time to the shared runtime log.
with open('runtime.log', 'a') as file_pointer:
    # str(timedelta) renders the duration as H:MM:SS[.ffffff]
    # https://stackoverflow.com/a/775095/10634604
    runtime_string = str(datetime.timedelta(seconds=runtime))
    file_pointer.write('\nRuntime for the pairwise/local hypothesis tests was {} in Hours:Minutes:Seconds.\n'.format(runtime_string))

# Persist all three result arrays in one compressed archive, keyed by name.
np.savez_compressed(results_filename, divergences=divergences, pvals=pvals,
                    sign_vectors=sign_vectors)