In [1]:
%load_ext autoreload
%autoreload 2
%matplotlib notebook

import numpy as np
import matplotlib.pyplot as plt
from scipy.optimize import root
import h5py
import os

## Read in single file output

In [2]:
# Single-file reader, currently disabled.
# Everything between the triple quotes below is one bare string literal, so none
# of it executes; the notebook simply echoes the string back as this cell's output.
# To read a single file, delete the opening and closing triple-quote lines.
# NOTE(review): after the first row is stored, C is an ndarray, so the `C == []`
# checks inside the string compare an array against a list -- verify those
# checks behave as intended before re-enabling.
"""
ftype = 'h5'
base = 'output/'
cfg = 'cl3_16_48_b6p1_m0p2450_output1693'
file = base + cfg + '.' + ftype
L3 = 48    #temporal extent of lattice
C = []
if ftype == 'txt':
    f = open(file, 'r')
    # New read in format: Each line after the first of form cfgId|a1+ib a2+ib ...
    f.readline()
    for i, line in enumerate(f):
        # if i not in sample_ids:
        #     continue
        cur_line = np.zeros(L3, dtype=complex)
        cfgIdx, rest = line.split('|')
        cfgIdx = int(cfgIdx)
        interps = rest.split(' ')    # now get real and complex
        for n_t, x in enumerate(interps):
            if not x.isspace():
                real, imag = x.split('+i(')    #form should be x = a+i(b)
                real = float(real)
                imag = float(imag.replace(')', ''))
                cur_line[n_t] = complex(real, imag)
        cur_line = [cur_line]
        if C == []:
            C = np.array(cur_line)
        else:
            C = np.append(C, cur_line, axis = 0)
elif ftype == 'h5':
    f = h5py.File(file, 'r')
    correlators = f['twopt']
    for i, data in correlators.items():
        if C == []:
            C = np.array(data)
        else:
            C = np.vstack([C, data])
else:
    raise Exception("File type cannot be read in.")
"""

'\nftype = \'h5\'\nbase = \'output/\'\ncfg = \'cl3_16_48_b6p1_m0p2450_output1693\'\nfile = base + cfg + \'.\' + ftype\nL3 = 48    #temporal extent of lattice\nC = []\nif ftype == \'txt\':\n    f = open(file, \'r\')\n    # New read in format: Each line after the first of form cfgId|a1+ib a2+ib ...\n    f.readline()\n    for i, line in enumerate(f):\n        # if i not in sample_ids:\n        #     continue\n        cur_line = np.zeros(L3, dtype=complex)\n        cfgIdx, rest = line.split(\'|\')\n        cfgIdx = int(cfgIdx)\n        interps = rest.split(\' \')    # now get real and complex\n        for n_t, x in enumerate(interps):\n            if not x.isspace():\n                real, imag = x.split(\'+i(\')    #form should be x = a+i(b)\n                real = float(real)\n                imag = float(imag.replace(\')\', \'\'))\n                cur_line[n_t] = complex(real, imag)\n        cur_line = [cur_line]\n        if C == []:\n            C = np.array(cur_line)\n        else:\n 

## Read in single directory output

In [3]:
# Read every 'twopt' dataset stored under one job directory and stack them
# row-wise into a single 2-D array C.
ftype = 'h5'    # not consulted below: every file found is opened as HDF5
job_num = 5023
base = './output/job' + str(job_num)

# Collect full paths. os.walk also descends into subdirectories, so each file name
# must be joined with the directory it was found in (dirpath) rather than with `base`.
files = []
for (dirpath, dirnames, filenames) in os.walk(base):
    files.extend(os.path.join(dirpath, name) for name in filenames)
files.sort()    # os.walk order is filesystem dependent; sorting makes the row order of C reproducible

# Gather all datasets first and stack once at the end (stacking inside the loop
# re-copies C on every iteration). The context manager closes each HDF5 handle
# as soon as its datasets have been copied into memory.
rows = []
for path_to_file in files:
    with h5py.File(path_to_file, 'r') as f:
        for data in f['twopt'].values():
            rows.append(np.array(data))

if not rows:
    # Fail here with a clear message instead of leaving C as an empty list.
    raise FileNotFoundError("No 'twopt' correlators found under " + base)
C = np.vstack(rows)    # always 2-D, even when only a single 1-D dataset was found

In [4]:
def bootstrap(C, n_boot = 500, rng = None):
    """
    Draw bootstrap resamples of an ensemble of correlators.

    Every resample picks C.shape[0] rows of C uniformly at random, with
    replacement.

    Parameters
    ----------
    C : array_like, shape (num_configs, n_t)
        Input ensemble; rows are the units that get resampled.
    n_boot : int, optional
        Number of bootstrap resamples to draw.
    rng : numpy.random.Generator or numpy.random.RandomState, optional
        Source of randomness, for reproducible draws. When omitted, the global
        `np.random` state is used, so `np.random.seed` still controls the draw.

    Returns
    -------
    samples : complex ndarray, shape (n_boot, num_configs, n_t)
        samples[b, k, :] is the row of C selected as the k-th draw of resample b.
    """
    C = np.asarray(C)
    num_configs = C.shape[0]
    sampler = np.random if rng is None else rng
    # One draw for all resamples: row b holds the configuration ids of resample b.
    cfgIds = sampler.choice(num_configs, size = (n_boot, num_configs))
    # Fancy indexing builds every resample at once; the result is always complex,
    # and no extra copy is made when C is already complex128.
    return C[cfgIds].astype(complex, copy = False)

In [5]:
# Ensemble dimensions, followed by the bootstrap resamples used by the cells below
num_configs, n_t = C.shape[0], C.shape[1]
samples = bootstrap(C)
print(samples.shape)

(500, 253, 48)


## Compute correlation function and effective mass

In [6]:
# Compute ensemble average of each correlation function
# ensemble_avg[b, :] is the mean over axis 1 (the resampled configurations) of bootstrap sample b
ensemble_avg = np.mean(samples, axis = 1)
# Central value: magnitude of the mean over bootstrap samples
μ_C = np.abs(np.mean(ensemble_avg, axis = 0))
# Spread over bootstrap samples. ddof = 1 keeps this consistent with the effective-mass
# error estimates in this notebook. np.std already returns a real, non-negative value for
# complex input, so no np.abs is needed.
σ_C = np.std(ensemble_avg, axis = 0, ddof = 1)

In [7]:
# Effective mass from the log of the ratio between neighbouring time slices
next_slice = np.roll(ensemble_avg, shift = -1, axis = 1)    # column t now holds the value from column t + 1
# The last column would pair the final time slice with the first one (wrap-around), so drop it
ratios = np.abs(ensemble_avg / next_slice)[:, :-1]
m_eff_ensemble = np.log(ratios)
# Mean and sample standard deviation over the bootstrap axis
μ_m_eff = m_eff_ensemble.mean(axis = 0)
σ_m_eff = m_eff_ensemble.std(axis = 0, ddof = 1)

In [8]:
# Compute cosh-corrected effective mass
# Temporal extent of the lattice. `ratios` has one column per pair of neighbouring
# time slices, i.e. one fewer than the number of time slices, so derive N from it
# instead of hard-coding the value.
N = ratios.shape[1] + 1
cosh_m_eff_ensemble = np.zeros(ratios.shape)
for ens_idx in range(ratios.shape[0]):
    for t in range(ratios.shape[1]):
        target = ratios[ens_idx, t]
        # Solve  target = cosh(m (t - N/2)) / cosh(m (t + 1 - N/2))  for m, using the
        # uncorrected effective mass as the starting guess.
        sol = root(lambda mass, t = t, target = target:
                       target - np.cosh(mass * (t - N / 2)) / np.cosh(mass * (t + 1 - N / 2)),
                   m_eff_ensemble[ens_idx, t])
        # sol.x is a length-1 array; index it explicitly because implicit
        # array-to-scalar conversion on assignment is deprecated in recent NumPy.
        cosh_m_eff_ensemble[ens_idx, t] = sol.x[0]
# Mean and sample standard deviation over the bootstrap axis
μ_cosh = np.mean(cosh_m_eff_ensemble, axis = 0)
σ_cosh = np.std(cosh_m_eff_ensemble, axis = 0, ddof = 1)

In [9]:
# Correlator magnitude with its bootstrap error bars, drawn on a logarithmic y axis
fig_corr, ax_corr = plt.subplots()
ax_corr.errorbar(range(1, n_t + 1), μ_C, yerr = σ_C)
ax_corr.set_yscale('log')
ax_corr.set_title('Correlation functions')
ax_corr.set_xlabel('$n_t$')
ax_corr.set_ylabel('$log(C(n_t))$')

<IPython.core.display.Javascript object>

Text(0, 0.5, '$log(C(n_t))$')

In [10]:
# Effective mass with its bootstrap error bars, y axis clipped to (-5, 5)
fig_meff, ax_meff = plt.subplots()
ax_meff.errorbar(range(1, n_t), μ_m_eff, yerr = σ_m_eff)
ax_meff.set_title('Effective mass')
ax_meff.set_ylim((-5, 5))
ax_meff.set_xlabel('$n_t$')
ax_meff.set_ylabel('$m_{eff}$')

<IPython.core.display.Javascript object>

Text(0, 0.5, '$m_{eff}$')

In [11]:
# Overlay the cosh-corrected and the plain (exponential) effective mass
fig_cmp, ax_cmp = plt.subplots()
time_axis = range(1, n_t)
ax_cmp.plot(time_axis, μ_cosh, 'r', label = 'cosh-corrected')
ax_cmp.plot(time_axis, μ_m_eff, 'b', label = 'exponential')

ax_cmp.set_title('$m_{eff}$ vs. cosh-corrected $m_{eff}$')
# ax_cmp.set_ylim((-3, 3))
ax_cmp.set_xlabel('$n_t$')
ax_cmp.set_ylabel('$m_{eff}$')
ax_cmp.legend()

plt.show()

<IPython.core.display.Javascript object>

In [12]:
# Disabled figure export.
# NOTE(review): in the cells shown here, `cfg` is only assigned inside the disabled
# single-file reader, and the target below is an absolute, user-specific path --
# both need attention before this line is re-enabled.
# plt.savefig('/Users/theoares/lqcd/pion_mass/output/' + cfg + '.png')

## Determine error scaling

In [13]:
# For growing sub-ensembles, record the bootstrap mean and error of the correlator
# at one fixed time-slice index.
base_time = 15    # index along the time axis at which mean and error are recorded
cfg_list = range(10, num_configs, 10)    # sub-ensemble sizes: 10, 20, ... (< num_configs)
err = np.zeros(len(cfg_list))
means = np.zeros(len(cfg_list))
for i, n in enumerate(cfg_list):    # sample n configurations from C
    config_ids = np.random.choice(num_configs, n, replace = False)    # distinct configurations
    C_sub = C[config_ids, :]    #now get error on the subsampled C
    subensemble = bootstrap(C_sub)
    subensemble_avg = np.mean(subensemble, axis = 1)
    μ = np.abs(np.mean(subensemble_avg, axis = 0))
    # ddof = 1 keeps this consistent with the effective-mass error estimates in this
    # notebook. np.std is already real and non-negative for complex input, so the
    # np.abs wrapper is unnecessary.
    σ = np.std(subensemble_avg, axis = 0, ddof = 1)
    err[i] = σ[base_time]
    means[i] = μ[base_time]

In [14]:
# Report the recorded error and mean for every sub-ensemble size
for label, values in (('Errors are: ', err), ('Average correlation function is: ', means)):
    print(label, values)

Errors are:  [1.08085207e-16 1.06849481e-16 6.39755271e-17 6.91766515e-17
 6.70445917e-17 6.53291432e-17 5.34461587e-17 4.56362557e-17
 5.01179898e-17 4.77923928e-17 3.92747990e-17 4.22023141e-17
 3.58833162e-17 3.86533867e-17 3.72532598e-17 3.48198296e-17
 3.69853594e-17 3.40810431e-17 3.18610162e-17 3.33510148e-17
 3.12641102e-17 3.01996528e-17 2.96845761e-17 2.99960764e-17
 2.81145106e-17]
Average correlation function is:  [1.73249607e-16 1.21895040e-17 8.17520579e-17 1.05524246e-16
 1.27362076e-16 1.31791744e-16 4.94365555e-17 7.10241911e-17
 7.87663357e-17 3.95128296e-17 6.06801081e-17 7.10862392e-17
 8.73036556e-18 7.22944128e-17 8.12817387e-17 5.43027899e-17
 4.47626356e-17 6.84324139e-17 5.66388511e-17 4.45925964e-17
 4.80246372e-17 5.49016116e-17 6.29879527e-17 4.99571608e-17
 4.96630861e-17]


In [15]:
# Scatter of the recorded error against the number of configurations sampled
fig_err, ax_err = plt.subplots()
ax_err.scatter(cfg_list, err)
ax_err.set_title('Error scaling')
ax_err.set_xlabel('Number of configurations sampled')
ax_err.set_ylabel('Error at time $n_t$ = ' + str(base_time))
# ax_err.set_ylim((1e-18, 1e-17))
# Pad the y range by 10% on either side of the observed errors
smallest_err, largest_err = np.min(err), np.max(err)
ax_err.set_ylim((.9 * smallest_err, 1.1 * largest_err))
plt.show()

<IPython.core.display.Javascript object>