## Imports

In [1]:
# Import necessary libraries and functions

from aux.imports import *
from aux.aux_scraper import scrape_all_pages, fetch_abstract, get_total_pages_from_inspire, add_abstracts
from aux.aux_functions import *

import openai
from openai import OpenAI

import pandas as pd
pd.set_option('display.max_colwidth', None)

from IPython.display import display

import os
import requests
import tarfile

openai.api_key = os.environ["OPENAI_API_KEY"]

# Directory to save the downloaded source files
save_dir = 'my_papers/original_texs'
polished_dir = 'my_papers/polished_texs'

os.makedirs(save_dir, exist_ok=True)
os.makedirs(polished_dir, exist_ok=True)

In [2]:
# Set up Chrome options for headless browsing
chrome_options = Options()
chrome_options.add_argument("--headless")  # Runs Chrome in headless mode

# Initialize the WebDriver with the specified options
driver = webdriver.Chrome(options=chrome_options)

In [3]:
url = "https://inspirehep.net/literature?sort=mostrecent&size=250&page=1&q=a%20muia&ui-citation-summary=true"

In [4]:
df = scrape_all_pages(driver, url)
df.head()

https://inspirehep.net/literature?sort=mostrecent&size=250&q=a%20muia&ui-citation-summary=true


Unnamed: 0,Title,Authors,ePrint Number,arXiv Category,DOI,Citation Count
0,String Thermodynamics In and Out of Equilibrium: Boltzmann Equations and Random Walks,"A. R. Frey, R. Mahanta, A. Maharana, F. Muia, F. Quevedo",2310.11494,hep-th,,1
1,"Quantum Transitions, Detailed Balance, Black Holes and Nothingness","S. Cespedes, S. de Alwis, F. Muia, F. Quevedo",2307.13614,hep-th,,4
2,Oscillon formation during inflationary preheating with general relativity,"J. C. Aurrekoetxea, K. Clough, F. Muia",2304.01673,gr-qc,10.1103/PhysRevD.108.023501,11
3,Testing BSM physics with gravitational waves,"F. Muia, F. Quevedo, A. Schachner, G. Villa",2303.01548,hep-ph,10.1088/1475-7516/2023/09/006,8
4,Hunt for light primordial black hole dark matter with ultrahigh-frequency gravitational waves,"G. Franciolini, A. Maharana, F. Muia",2205.02153,astro-ph.CO,10.1103/PhysRevD.106.103520,48


In [5]:
list_of_arxiv_no = df['ePrint Number'].tolist()

In [6]:
for arxiv_id in list_of_arxiv_no:
    url = f'http://arxiv.org/e-print/{arxiv_id}'
    
    # Make the request and download the file
    response = requests.get(url)
    
    if response.status_code == 200:
        tar_path = os.path.join(save_dir, f'{arxiv_id}.tar.gz')
        
        with open(tar_path, 'wb') as file:
            file.write(response.content)
        print(f'Downloaded {arxiv_id}')
        
        # Extract .tex files from the downloaded tar.gz file, if valid
        extract_to = os.path.join(save_dir)  # Specify the directory for extracted files
        os.makedirs(extract_to, exist_ok=True)
        if extract_tex_files(tar_path, extract_to, arxiv_id):
            print(f'Extracted LaTeX sources for {arxiv_id}')
        else:
            print(f'{arxiv_id}.tar.gz is not a valid archive or does not contain .tex files.')
        
        # Optionally, delete the .tar.gz file regardless of extraction success
        os.remove(tar_path)
        print(f'Deleted archive {arxiv_id}.tar.gz')
    else:
        print(f'Failed to download {arxiv_id}. Status code: {response.status_code}')

Downloaded 2310.11494
Extracted LaTeX sources for 2310.11494
Deleted archive 2310.11494.tar.gz
Downloaded 2307.13614
Extracted LaTeX sources for 2307.13614
Deleted archive 2307.13614.tar.gz
Downloaded 2304.01673
Extracted LaTeX sources for 2304.01673
Deleted archive 2304.01673.tar.gz
Downloaded 2303.01548
Extracted LaTeX sources for 2303.01548
Deleted archive 2303.01548.tar.gz
Downloaded 2205.02153
Extracted LaTeX sources for 2205.02153
Deleted archive 2205.02153.tar.gz
Downloaded 2112.11486
Extracted LaTeX sources for 2112.11486
Deleted archive 2112.11486.tar.gz
Downloaded 2112.11650
Extracted LaTeX sources for 2112.11650
Deleted archive 2112.11650.tar.gz
Downloaded 2201.03458
2201.03458.tar.gz is not a valid archive or does not contain .tex files.
Deleted archive 2201.03458.tar.gz
Downloaded 2107.12392
Extracted LaTeX sources for 2107.12392
Deleted archive 2107.12392.tar.gz
Downloaded 2107.03391
Extracted LaTeX sources for 2107.03391
Deleted archive 2107.03391.tar.gz
Downloaded 2103.

In [6]:
newcommand_pattern = re.compile(r'\\newcommand\{\\(\w+)\}\s*\{((?:[^{}]|{[^{}]*})*)\}')

all_matches = []  # This will aggregate all matches from all files

for filename in os.listdir(save_dir):
    if filename.endswith('.tex'):
        #print(filename)
        with open(os.path.join(save_dir, filename), 'r', encoding='utf-8') as file:
            content = file.read()
            matches = newcommand_pattern.findall(content)
            #print(matches)
            all_matches.extend(matches)  # Aggregate matches from this file

replacement_dictionary = {name: replacement for name, replacement in all_matches}


In [7]:
dict_replacem = create_replacement_dictionary(save_dir)

In [20]:
apply_replacement_to_files(save_dir, dict_replacem, polished_dir)

In [23]:
combined_file_path = 'my_papers/combined_latex_file.txt'  # Path for the combined LaTeX file

with open(combined_file_path, 'w', encoding='utf-8') as combined_file:
    first_file = True  # Flag to avoid adding separator before the first file
    for filename in os.listdir(polished_dir):
        if filename.endswith('.tex'):
            file_path = os.path.join(polished_dir, filename)
            with open(file_path, 'r', encoding='utf-8') as file:
                
                content = file.read()
                
                content = re.sub(r'\\begin\{figure(\*?)\}.*?\\end\{figure\1\}', '', content, flags=re.DOTALL)
                print(content[0:1500])

                # Patterns for abstract and section
                abstract_pattern = re.compile(r"\\begin\{abstract\}", re.IGNORECASE)
                section_pattern = re.compile(r"\\section\{")

                # Flag to mark if the abstract or section has been found
                found_abstract_or_section = False
                
                # Remove everything after \begin{thebibliography} if it exists
                content = re.split(r'\\begin\{thebibliography\}', content, maxsplit=1)[0]

                # Remove the acknowledgements section
                content = re.split(r'\\section\*?\{Acknowledgements\}', content, maxsplit=1)[0]

                # Find the first section as a fallback if no abstract is found
                section_start = re.search(r'\\section', content)
                if section_start:
                    content = content[section_start.start():]
                
                # Add separator between papers, except before the first file
                if not first_file:
                    combined_file.write("/------- NEW PAPER -------/\n\n")
                else:
                    first_file = False
                
                combined_file.write(content.strip() + "\n\n")

# Read the combined file
with open(combined_file_path, 'r', encoding='utf-8') as file:
    combined_content = file.read()

\pdfoutput=1
\documentclass[fleqn,usenatbib,useAMS]{mnras}
\usepackage{newtxtext,newtxmath}
\usepackage{amsmath,amssymb}
\usepackage[T1]{fontenc}
%\usepackage{ae,aecompl}
\usepackage{natbib}
\usepackage{epsfig}
\usepackage{graphicx}
\usepackage{tablefootnote}
%\usepackage[export]{adjustbox}
\usepackage{floatrow}
\usepackage{caption}
%\usepackage{hyperref}

\newcommand{}{\mathcal}

\title[Projected bounds on ALPs from ATHENA]{Projected bounds on ALPs from {\it Athena}}
\author[J. P. Conlon et al.]{
Joseph P. Conlon$^{1}$,
Francesca Day$^{1}$, 
Nicholas Jennings$^{1}$\thanks{E-mail: nicholas.jennings@physics.ox.ac.uk}, 
Sven Krippendorf$^{1}$
\newauthor{ and Francesco Muia$^{1}$}
\\
% List of institutions
$^{1}$Rudolf Peierls Centre for Theoretical Physics, 1 Keble Road, Oxford, OX1 3NP, UK\\
}
\date{\today}

\pubyear{2017}

\begin{document}
\label{firstpage}
\pagerange{\pageref{firstpage}--\pageref{lastpage}}
\maketitle

\begin{abstract}
Galaxy clusters represent excellent laboratories 

In [32]:
combined_file_path = 'my_papers/combined_latex_file.txt'  # Path for the combined LaTeX file

# Patterns for abstract, section, acknowledgements, and bibliography
abstract_pattern = re.compile(r"\\(?:begin\{abstract\}|abstract)", re.IGNORECASE)
section_pattern = re.compile(r"\\section\{")
acknowledgements_pattern = re.compile(r"\\(?:section|subsection|subsubsection|paragraph)\*?\s*\{(Acknowledgements|Acknowledgments)\}|\\(?:acknowledgements|acknowledgments)", re.IGNORECASE)
bibliography_pattern = re.compile(r"\\(?:begin\{thebibliography\}|bibliography)")

with open(combined_file_path, 'w', encoding='utf-8') as combined_file:
    first_file = True  # Flag to avoid adding separator before the first file
    for filename in os.listdir(polished_dir):
        if filename.endswith('.tex'):
            file_path = os.path.join(polished_dir, filename)
            with open(file_path, 'r', encoding='utf-8') as file:
                content = file.read()
                
                # Remove figure environments and commented out lines
                content = re.sub(r'\\begin\{figure(\*?)\}.*?\\end\{figure\1\}', '', content, flags=re.DOTALL)
                content = re.sub(r'^%.*\n?', '', content, flags=re.MULTILINE)
                
                # Start parsing at \begin{abstract} or the first \section{...}, if abstract is not present
                start_point = abstract_pattern.search(content) or section_pattern.search(content)
                if start_point:
                    content = content[start_point.start():]
                # Note: if neither \begin{abstract} nor \section is found, content remains unchanged
                
                # Remove everything after \begin{thebibliography}, if present
                content = bibliography_pattern.split(content)[0]

                # Remove the acknowledgements section, if present
                content = acknowledgements_pattern.split(content)[0]

                # Add separator between papers, except before the first file
                if not first_file:
                    combined_file.write(f"\n\n/------- NEW DOCUMENT - {filename} -------/\n\n")
                else:
                    first_file = False
                
                combined_file.write(content.strip() + "\n\n")


# this didn't capture the following cases:

#\section*{Acknowlegdments}
#\paragraph{Acknowledgements}
#\section*{Acknowledgments}
#\acknowledgments

In [10]:
def handle_latex_commands(text, to_remove, to_ignore, to_headline):
    """
    Remove specified LaTeX commands from the text.
    Args:
    - text (str): The input LaTeX document as a string.
    - to_remove (list): A list of commands (as regex patterns) to remove.
    
    Returns:
    - str: The text with specified commands removed.
    """
    for command in to_remove:
        pattern = r'\\' + command + r'(\[[^\]]*\])?(\{[^\}]*\})?\s*'
        text = re.sub(pattern, '', text)
    
    # Handling specific patterns with a more targeted approach
    text = re.sub(r'\\pdfoutput\s*=\s*\d\s*', '', text)
    text = re.sub(r'\\begin\{document\}\s*', '', text)
    text = re.sub(r'\\begin\{titlepage\}\s*', '', text)
    # Add or adjust patterns as needed

    # Handling commands to ignore by retaining their content
    for command in to_ignore:
        if command in ['center', 'array', 'minipage', 'titlepage']:  # Environment commands
            pattern = r'\\begin\{' + command + r'\}(.*?)\\end\{' + command + r'\}'
            text = re.sub(pattern, r'\1', text, flags=re.DOTALL)
        else:  # Text formatting commands
            # Handling the case where commands are used with curly brackets around
            text = re.sub(r'{\\' + command + r'\s+([^}]*)}', r'\1', text)
            # Handling the case where commands are used without curly brackets around
            pattern = r'\\' + command + r'\{([^}]*)\}'
            text = re.sub(pattern, r'\1', text)
            pattern = r'\\' + command + r'(\{([^}]*)\})?'
            text = re.sub(pattern, r'\1', text)        
    
    for command in to_headline:
        # Capitalize the first letter of each command for the output
        formatted_command = command.capitalize()
        # Replace command with formatted headline, including optional arguments
        text = re.sub(r'\\' + command + r'(\[[^\]]*\])?\{([^}]*)\}', r'\n' + formatted_command + r': \2\n', text)
        # Replace command with formatted headline, including optional arguments
        text = re.sub(r'\\begin\{' + command + r'\}(.*?)\\end\{' + command + r'\}', r'\n' + formatted_command + r': \1\n', text, flags=re.DOTALL)

    # Handle citations and footnotes
    text = re.sub(r'\\cite\{([^}]*)\}', r'[\1]', text)
    text = re.sub(r'\\footnote\{([^}]*)\}', r' (\1)', text)

    # Optionally, remove blank lines after processing
    text = re.sub(r'%', '', text)
    # Removing empty curly brackets with only whitespaces
    text = re.sub(r'\{\s*\}', '', text)
    text = re.sub(r'\\{2,}', '', text)
    text = re.sub(r'\n{2,}', ' ', text)
    text = re.sub(r'\s{2,}', ' ', text)


    return text

In [11]:
commands_to_remove = ['usepackage', 'documentclass', 'setcounter', 'numberwithin', 'today', 'pageref', 'thanks', 'pagerange',
                      'setlength', 'definecolor', 'newcommand', 'renewcommand', 'textwidth', 'date', 'text', 'centering',
                      'vskip', 'hskip', 'thispagestyle', 'LARGE', 'Huge', 'huge', 'Large', 'large', 'bibliographystyle', 'bibliography',
                      'normalsize', 'small', 'footnotesize', 'scriptsize', 'tiny', 'label', 'pubyear']

commands_to_ignore = ['textbf', 'mathcal', 'cal' 'textit', 'bf', 'it', 'emph', 'sl', 'sf', 'sc', 'tt', 'center', 'rm',
                      'array', 'minipage', 'titlepage', 'newauthor', 'maketitle', 'quad', 'qquad', 'Bigg', 'mbox']

commands_to_headline = ['section', 'subsection', 'subsubsection', 'paragraph', 'abstract', 'title', 'author', 'keywords', 'appendix']



In [12]:
combined_content[0:1000]

'\\section{Introduction}\n\\label{introduction}\nX-ray astronomy provides a novel arena for fundamental physics. Thanks to exciting recent data, such as the observed excess at 3.5~keV \\cite{Bulbul, Boyarsky}, there has been a renewed interest among particle physicists in the great promise of X-ray astronomy to shed light on physics beyond the Standard Model, including the existence of new particles.\n\nOne area for which X-ray astronomy is particularly suitable\n is in the search for Axion-Like Particles (ALPs).\nALPs are light pseudo-scalars that are a well motivated extension of the Standard Model \\cite{PecceiQuinn,Wilczek,Weinberg} that arise\n generically in string compactifications, for example see \\cite{hep-th/0602233,hep-th/0605206,1206.0819}. A general review of ALPs is \\cite{RingwaldReview}. In the presence of a magnetic field $\\langle B \\rangle$ ALPs and photons interconvert \\cite{Sikivie:1983ip, Raffelt:1987im}, and this induces quasi-sinusoidal oscillations at X-ray 

In [13]:
handle_latex_commands(combined_content, commands_to_remove, commands_to_ignore, commands_to_headline)



In [11]:
# Step 2: Remove figure content, then split the combined file into chunks based on section commands
section_commands = re.compile(r'\\(sub)*section{.*?}', re.DOTALL)

# Read the combined file
with open(combined_file_path, 'r', encoding='utf-8') as file:
    combined_content = file.read()

# Remove content between \begin{figure} and \end{figure}
combined_content = re.sub(r'\\begin\{figure(\*?)\}.*?\\end\{figure\1\}', '', combined_content, flags=re.DOTALL)

# Split the content into chunks
chunks = section_commands.split(combined_content)

# Filter out empty chunks
chunks = [chunk for chunk in chunks if chunk and chunk.strip()]

In [12]:
# Step 3: Store all the chunks into a DataFrame
df_chunks = pd.DataFrame({'chunk': chunks})

print(f"Total chunks created: {len(df_chunks)}")

# Optionally, save the DataFrame to a CSV file
df_chunks.to_csv('latex_chunks.csv', index=False)

Total chunks created: 1155


In [23]:
pd.set_option('display.max_colwidth', None)
display(df_chunks)  # Show the first few chunks for verification

Unnamed: 0,chunk
0,"\pdfoutput=1\n\documentclass[fleqn,usenatbib,useAMS]{mnras}\n\usepackage{newtxtext,newtxmath}\n\usepackage{amsmath,amssymb}\n\usepackage[T1]{fontenc}\n%\usepackage{ae,aecompl}\n\usepackage{natbib}\n\usepackage{epsfig}\n\usepackage{graphicx}\n\usepackage{tablefootnote}\n%\usepackage[export]{adjustbox}\n\usepackage{floatrow}\n\usepackage{caption}\n%\usepackage{hyperref}\n\n\newcommand{}{\mathcal}\n\n\title[Projected bounds on ALPs from ATHENA]{Projected bounds on ALPs from {\it Athena}}\n\author[J. P. Conlon et al.]{\nJoseph P. Conlon$^{1}$,\nFrancesca Day$^{1}$, \nNicholas Jennings$^{1}$\thanks{E-mail: nicholas.jennings@physics.ox.ac.uk}, \nSven Krippendorf$^{1}$\n\newauthor{ and Francesco Muia$^{1}$}\n\\\n% List of institutions\n$^{1}$Rudolf Peierls Centre for Theoretical Physics, 1 Keble Road, Oxford, OX1 3NP, UK\\\n}\n\date{\today}\n\n\pubyear{2017}\n\n\begin{document}\n\label{firstpage}\n\pagerange{\pageref{firstpage}--\pageref{lastpage}}\n\maketitle\n\n\begin{abstract}\nGalaxy clusters represent excellent laboratories to search for Axion-Like Particles (ALPs). They contain magnetic fields which can induce quasi-sinusoidal oscillations in the X-ray spectra of AGNs situated in or behind them. Due to its excellent \nenergy resolution, the X-ray Integral Field Unit (X-IFU) instrument onboard the {\it Athena} X-ray Observatory will be far more sensitive to ALP-induced modulations than current detectors. As a first analysis of the sensitivity of {\it Athena} to the ALP-photon coupling $g_{a \gamma \gamma}$, we simulate observations of the Seyfert galaxy NGC~1275 (hosting the radio source 3C~84) in the Perseus cluster using the SIXTE simulation software. We estimate that for a 200~ks exposure, a non-observation of spectral modulations will constrain ${g_{a\gamma\gamma}\lesssim1.5\times10^{-13}~\rm{GeV}^{-1}}$ for $m_a\lesssim10^{-12}~\rm{eV}$, representing an order of magnitude improvement over constraints derived using the current generation of satellites.\n\end{abstract}\n\n\begin{keywords}\nastroparticle physics -- elementary particles -- galaxies: clusters: individual: Perseus\n\end{keywords}\n\n"
1,"\n\label{introduction}\nX-ray astronomy provides a novel arena for fundamental physics. Thanks to exciting recent data, such as the observed excess at 3.5~keV \cite{Bulbul, Boyarsky}, there has been a renewed interest among particle physicists in the great promise of X-ray astronomy to shed light on physics beyond the Standard Model, including the existence of new particles.\n\nOne area for which X-ray astronomy is particularly suitable\n is in the search for Axion-Like Particles (ALPs).\nALPs are light pseudo-scalars that are a well motivated extension of the Standard Model \cite{PecceiQuinn,Wilczek,Weinberg} that arise\n generically in string compactifications, for example see \cite{hep-th/0602233,hep-th/0605206,1206.0819}. A general review of ALPs is \cite{RingwaldReview}. In the presence of a magnetic field $\langle B \rangle$ ALPs and photons interconvert \cite{Sikivie:1983ip, Raffelt:1987im}, and this induces quasi-sinusoidal oscillations at X-ray energies in the spectra of sources in and around galaxy clusters \cite{1304.0989, 1509.06748}.\n\nSearches for these oscillations can be used to constrain ALP parameter space.\nCurrent constraints on ALPs derived in this fashion \cite{1304.0989, Berg:2016ese, Marsh:2017yvc,Conlon:2017qcw} are based on data taken with CCD detectors, which have an energy resolution of $\mathcal{O}(100~\rm{eV})$. A large improvement with sensitivity will be achieved once data becomes available from microcalorimeters with $\mathcal{O}({\rm a~few} \, \rm{eV})$ energy resolution.\nSuch microcalorimeters will be on board the Advanced Telescope for High ENergy Astrophysics (ATHENA), currently scheduled to launch in 2028.\nIts X-IFU instrument will have both large effective area, good imaging and energy resolution of $\sim 2.5 \rm{eV}$, greatly enhancing the discovery potential for ALPs.\n\nIn this paper we provide a first estimate for the experimental sensitivity of {\it Athena} to ALPs. We do so using simulated data for a mock observation of NGC~1275, hosting the radio source 3C~84, which contains the central AGN of the Perseus cluster.\nThis object was chosen as we have previously used it to place bounds on ALPs using {\it Chandra} data \cite{Berg:2016ese}.\n\n"
2,"\n\label{alps}\nAn ALP $a$ couples to electromagnetism through the Lagrangian term:\n\begin{equation}\n\label{ALPphoton}\n\qquad L = \frac{1}{4 M}~a~F_{\mu \nu} \tilde{F}^{\mu \nu} = \frac{1}{M}~a~{\bf E} \cdot {\bf B}~,\n\end{equation}\nwhere ${M^{-1} = g_{a\gamma\gamma}}$ parametrises the strength of the interaction,\nand ${\bf E}$ and ${\bf B}$ are the electric and magnetic fields.\nAs their potential and interactions are protected by shift symmetries, ALPs can naturally have very small masses $m_a$. The probability of ALP-photon interaction in the presence of an external magnetic field $\langle B \rangle$ is a standard result \cite{Sikivie:1983ip, Raffelt:1987im}. \n\nThe full analytic expression for the probability of an ALP being converted to a photon after propagating through a single magnetic field domain of length $L$ is:\n\begin{equation}\n\qquad P_{a \rightarrow \gamma} = \frac{1}{2}\frac{\Theta^2}{1 + \Theta^2}\sin^2 \left( \Delta \sqrt{1 + \Theta^2} \right),\n\end{equation}\nwhere\n\begin{equation}\n\qquad \Theta = 0.28 \Bigg(\frac{B_{\perp}}{1 \mu\rm{G}}\Bigg)\Bigg(\frac{\omega}{1 \, \rm{keV}}\Bigg)\Bigg(\frac{10^{-3} \rm{cm}^{-3}}{n_e}\Bigg)\Bigg(\frac{10^{11} \rm{GeV}}{M}\Bigg),\n\end{equation}\n\begin{equation}\n\qquad \Delta = 0.54 \Bigg(\frac{n_e}{10^{-3} \rm{cm}^{-3}}\Bigg)\Bigg(\frac{L}{10 \, \rm{kpc}}\Bigg)\Bigg(\frac{1 \rm{keV}}{\omega}\Bigg).\n\end{equation}\nHere $B_{\perp}$ denotes the magnetic field component perpendicular to the ALP wave vector, $\omega$ is the energy and $n_e$ is the electron density. In the limit $\Delta, \Theta \ll 1$, $P \propto B^2 L^2 / M^2$. However when $\Theta < 1$ but $\Delta > 1$, then\n$ P \propto \Theta^2 \sin^2 \Delta$.\nThis probability grows with energy, containing oscillations that are rapid at low energies and broader at higher energies. These\noscillations leave a distinctive imprint on otherwise featureless spectra, and their absence allows us to constrain $g_{a\gamma\gamma}$.\n\nThis photon-ALP interconversion is particularly efficient in galaxy clusters (e.g. see ~\cite{0902.2320,1305.3603}).\nClusters have ${\bf B}$ fields of order $\sim \mu$G which extend over megaparsec scales, within which the magnetic field coherence lengths reach tens of kiloparsecs.\nThe relatively low electron densities ($\sim 10^{-3}\rm{cm}^{-3}$) also implies that it is at X-ray energies that the `sweet spot' of large\n $\Delta$, small $\Theta$, and quasi-sinusoidal energy-dependent $P_{\gamma \leftrightarrow a}$ is located ~\cite{1304.0989, 1305.3603, 1312.3947, 1509.06748}.\n\nThe 3D structure of intracluster magnetic fields is in general not known and so\nthe precise form of the survival probability along any single line of sight cannot be determined. Figure~\ref{fig:ALPPhotonConversion} illustrates the energy-dependent survival probability for a photon passing across three hundred domains of a magnetic field, with the direction of the magnetic\nfield randomised within each domain. The electron density and magnetic field strength in\nthe model are based on those applicable in the Perseus cluster, but the pattern of smaller, rapid oscillations at low energies and slow oscillations with greater amplitude at high energies is generic.\n\nActive Galactic Nuclei (AGNs) situated in or behind galaxy clusters provide excellent X-ray sources to search for such spectral modulations. One outstanding example is the bright central AGN of the Perseus cluster, at the heart of the galaxy NGC~1275.\nIts intrinsic spectrum is well described by an absorbed power law \cite{Churazov:2003hr,Yamazaki, Balmaverde2006, Fabian:2015kua}, and dominates the background cluster emission. The central cluster magnetic field value is estimated at $ \sim 25 \mu$G by \cite{0602622}.\n\nAn analysis of archival data of observations of NGC~1275 by the {\it Chandra} and {\it XMM-Newton} satellites was done in \cite{Berg:2016ese}\n(see \cite{1603.06978} for a related analysis of NGC~1275 in gamma rays).\nExtending methods pioneered in \cite{1304.0989}, the constraint on the ALP-photon coupling ${g_{a\gamma\gamma} \lesssim 1.5 \times 10^{-12}~{\rm GeV}^{-1}}$ was found. For M87, a similar treatment was performed in \cite{Marsh:2017yvc}, finding a\nbound ${g_{a\gamma\gamma} \lesssim 1.5 \times 10^{-12}~{\rm GeV}^{-1}}$. An analysis of {\it Chandra} data of other bright point sources in galaxy clusters was conducted in (\cite{Conlon:2017qcw}), deriving bounds of ${g_{a\gamma\gamma} \lesssim 1.5 \times 10^{-12}~{\rm GeV}^{-1}}$ (for the Seyfert galaxy 2E~3140) and ${g_{a\gamma\gamma} \lesssim 2.4 \times 10^{-12}~{\rm GeV}^{-1}}$ (for the AGN NGC~3862).\n\n%%{\bf These bounds are superior to those derived from SN 1987A, and are similar to IAXO in this low mass region. The absence of CMB distortions %\cite{Mirizzi:2009aj, Tashiro:2013yea} \n%%constrain the product $g B < 10^{-13} \text{GeV}^{-1} \text{nG}$, which are competitive with bounds from galaxy clusters if the cosmic magnetic field saturates the observed bound < nG. This is complementary to DM haloscopes searches.}\n\nThese bounds all hold for light ALPs with masses $m_a \lesssim 10^{-12} {\rm eV}$. This implies that these methods are not sensitive\nto an ordinary QCD axion, which for a photon couplings $g_{a\gamma\gamma} \sim 10^{-12} {\rm GeV}^{-1}$ would typically have $m_a \sim 10^{-3} {\rm eV}$. However, unconventional models for the QCD axion where the photon coupling is significantly enhanced compared to naive expectation may\nbe constrained using these techniques.\n\nThe bounds produced are superior to the bound on light ALPs derived from SN 1987A of $g_{a \gamma \gamma} < 5 \times 10^{-12} \text{GeV}^{-1}$ \cite{Payez:2014xsa}, and are similar to those projected for IAXO in this low mass region \cite{Irastorza:2012qf}. The bounds are also superior to those inferred from the absence of CMB distortions in \mbox{COBE FIRAS} data \cite{Mirizzi:2009nq}, which constrain the product $g_{a \gamma \gamma} B < 10^{-11} \text{GeV}^{-1} \text{nG}$. Here $B$ is the strength of the cosmic magnetic field, which is limited to $B<\text{nG}$.\n\nOne major limiting constraint on existing data is the energy resolution of the detectors.\nIf they exist, ALPs provide oscillatory structure all the way down to the lowest energies.\nHowever, as illustrated in Figure~\ref{fig:ALPPhotonConversion}, detectors with energy resolutions of $\mathcal{O}(100~\rm{eV})$ cannot resolve this structure at lower energies -- but this does become accessible once a resolution of $\mathcal{O}(2.5~\rm{eV})$ is achieved. We now discuss the future {\it Athena} X-ray observatory, whose greatly enhanced technical capabilities offer improved sensitivity to ALP-photon interconversion.\n\n\n"
3,"}\n\label{athena}\nThe Advanced Telescope for High ENergy Astrophysics (ATHENA) is an ESA mission to explore the Hot and Energetic Universe, due to launch in 2028 \cite{Nandra:2013shg}. The mirror will have a $2~\rm{m}^2$ effective area and a 5~arcsec angular resolution. There are two instruments: the X-ray Integral Field Unit (X-IFU) and the Wide Field Imager (WFI). Here we focus on the former, which will consist of an array of TiAu Transition Edge Sensor (TES) micro-calorimeters sensitive to the energy range 0.2--12~keV \cite{Barret:2016ett}. When operated at a temperature of 50 mK, these can achieve an energy resolution of 2.5~eV below 7~keV \cite{Gottardi:2016cdx}, implying X-IFU will be able to resolve narrow spectral oscillations. A readout time of $\sim10~\mu\rm{s}$ will ensure pileup contamination is minimised. Table~\ref{satellites} contains\na summary of its properties, taken from the {\it Athena} Mission Proposal\footnote{http://www.the-athena-x-ray-observatory.eu/images/AthenaPapers/ \\ The\_Athena\_Mission\_Proposal.pdf}, compared to properties of the {\it Chandra} ACIS-I detector, taken from the {\it Chandra} Proposer's Guide\footnote{http://cxc.harvard.edu/proposer/POG/html/chap6.html}.\n\n\begin{table}\n\n\centering\n\begin{tabular}{r|c|c}\n& {\it Athena} (X-IFU) & {\it Chandra} (ACIS-I)\\\n%& (X-IFU) & (ACIS-I)\\\n\hline\hline\nEnergy range & 0.2--12 keV & 0.3--10 keV\\ \hline\nEnergy resolution & 2.5 eV & 150 eV\\ \n at 6 keV & & \\ \hline\nSpatial resolution & 5 arcsec & 0.5 arcsec\\ \hline\nTime resolution & 10~$\mu$s & 0.2 s\\\n& & (2.8~ms single row)\\ \hline\nEffective area & 2~m$^2$ @ 1 keV & 600~cm$^2$ @ 1.5 keV \\ \hline\n\end{tabular}\n\caption{Parameters taken from the {\it Athena} Mission Proposal and the {\it Chandra} Proposer's Guide.}\n\label{satellites}\n\end{table}\n\nThe combination of larger effective area, greatly improved energy resolution and reduced pileup contamination means {\it Athena} has far more potential to detect ALP-induced oscillations than the best current satellites. The aim of this paper is\nto make the first quantitative estimate of the extent to which {\it Athena} will be able to improve constraints on\n$g_{a\gamma\gamma}$.\n\n"
4,"\n\label{bounds}\nIn terms of estimating bounds on $g_{a\gamma\gamma}$ we use the same method as previously applied with\n{\it Chandra} data \cite{Berg:2016ese}. This allows for a direct comparison\nbetween the capabilities of {\it Chandra} and {\it Athena} in terms of placing bounds.\n\nWe simulate {\it Athena} observations of NGC~1275, using two models for the photon spectra of the AGN.\nThe first is a standard spectrum without ALPs, and the second is a model with the same spectrum multiplied with the\nphoton survival probability distribution as introduced in Section~\ref{alps}. Using simulations of the\nX-IFU detector response, we fit spectra generated assuming ALP-photon conversion with the model without ALPs (Model 0) and then we compare this fit to the fit of the spectrum generated without ALPs to the same model.\nTo allow for the uncertainty in the\nmagnetic field configuration along the line of sight, we repeat this analysis using many different randomly generated magnetic fields.\n\nThe two photon spectra that we model are:\n\begin{enumerate}\n\item Model 0: An absorbed power law plus thermal background:\n\begin{equation}\n\qquad F_{0}(E) = (A E^ {- \gamma} + \mathtt{BAPEC}) \times e^{-n_{H} \sigma(E,z)},\n\end{equation}\nwhere $A$ and $\gamma$ are the amplitude and index of the power law, $E$ is the energy, $n_H$ is the equivalent hydrogen column, $\sigma(E, z)$ is the photo-electric cross-section at redshift $z$, and $\mathtt{BAPEC}$ is the standard plasma thermal emission model.\n\item Model 1: An absorbed power law plus thermal background, multiplied by a table of survival probabilities for photons of different energies:\n\begin{equation}\nF_{1}(E, {\bf B}) = (A E^ {- \gamma} + \mathtt{BAPEC}) \times e^{-n_{H} \sigma(E,z)} \times P_{\gamma \to \gamma} (E (1 + z), { \bf B}, g_{a \gamma \gamma})~.\n\end{equation}\n\end{enumerate}\nThe index of the power law was set based on the best fit value from the cleanest {\it Chandra} observations of NGC~1275, and its normalisation was determined based on the {\it Hitomi} 230~ks observation of Perseus in 2016 \cite{Aharonian:2016gzq}. As the AGN in 2016 was\nroughly twice as bright as in 2009 and it has previously exhibited large historical variation \cite{Fabian:2015kua}, it may be again much brighter (or dimmer) in 2028, which would affect both the contrast\nagainst the cluster background and also the observation time required to achieve a certain constraint on $g_{a \gamma \gamma}$.\n\nThe 2016 {\it Hitomi} observation also constrained the temperature, abundances and velocity dispersion of the cluster thermal emission to a high degree of accuracy \cite{Aharonian:2016gzq}.\nFor the spectral shape of the cluster background, we used the single-temperature $\mathtt{bapec}$ model that was a good fit\nto the {\it Hitomi} spectrum across its field of view. While this single-temperature model is unlikely to be a good fit for the background\ncontiguous to the AGN, it represents a useful proxy for the actual background that can only be determined at the time.\nThe normalisation of the background was set by extracting a circular region\nof the cluster emission close to the AGN from the {\it Chandra} observations, of radius equal to the angular resolution of {\it Athena}, and determining the best fit. All model parameters are shown in Table \ref{parameters}.\n\begin{table}\n\centering\n\begin{tabular}{l|l|c|c}\nModel & parameter & symbol & value\\ \hline \hline\n$\mathtt{zwabs}$ & nH column density & $n_H$ & $0.24 \times 10^{22} \rm{cm}^{-2}$\\\n & redshift & z & 0.0176\\ \hline\n$\mathtt{powerlaw}$ & index & $\gamma$ & 1.8\\\n & normalisation & A & $9 \times 10^{-3}$\\ \hline\n$\mathtt{bapec}$ & temperature & kT & 3.48 keV\\\n & abundances & & 0.54 solar\\\n & velocity dispersion & v & 178 m \,${\rm s}^{-1}$\\\n& normalisation & N & $9 \times 10^{-4}$\n\end{tabular}\n\caption{Parameters of the absorbed power law describing the spectrum of NGC~1275, and the thermal model of the cluster background.}\n\label{parameters}\n\end{table}\n\nAs for the study with {\it Chandra}, we take the central magnetic field value as $B_0\sim 25\mu $G, following \cite{0602622}. We also\nassume that $B$ decreases with radius as $B \propto n_{e}^{0.7}$.\nAs there is not a direct measurement of the power spectrum and coherence length for the Perseus magnetic field, we base the model on those inferred for the cool core cluster A2199 \cite{Vacca:2012up}.\n\nThe electron density $n_{e}$ has the radial distribution found in \cite{Churazov:2003hr}:\n\begin{equation}\n\qquad n_{e} (r) = \frac{3.9 \times 10^{-2}}{ [ 1 + (\frac{r}{80 \, {\rm kpc}})^2]^{1.8}} + \frac{4.05 \times 10^{-3}}{ [ 1 + (\frac{r}{280 \, {\rm kpc}})^2]^{0.87}} \, {\rm cm}^{-3}.\n\end{equation}\n\nThe magnetic field is generated over 300 domains, whose lengths are drawn from a Pareto distribution between $3.5~\rm{kpc}$ and $10~\rm{kpc}$ with power 2.8. In each domain the magnetic field and electron density are constant, with a random direction of ${\bf B}$. We then\ncalculate the survival probability of a photon passing through this region, as described in \cite{1312.3947}.\n\nThe simulations were performed using the Simulation of X-ray Telescopes ($\mathtt{SIXTE}$) code, a multi-instrument simulation package. It aims to offer an end-to-end simulation, i.e. the full detector chain from the source to the final data. It models the telescope's vignetting, ARF and PSF, and X-IFU's response, event reconstruction and pileup \cite{2014SPIE.9144E..5XW}.\n\nThe spectrum of NGC~1275, and the cluster background, were modelled in $\mathtt{XSPEC}$\footnote{https://heasarc.gsfc.nasa.gov/xanadu/xspec/manual/manual.html} as an absorbed power law plus a thermal component, $\mathtt{zwabs*(powerlaw + bapec)}$. This spectrum, either multiplied with the photon survival probabilities or not, was converted to the SIMPUT\footnote{http://hea-www.harvard.edu/heasarc/formats/simput-1.0.0.pdf} file format using the command $\mathtt{simputfile}$. The mirror and detector response were modelled with $\mathtt{xifupipeline}$, using the ARF file $\mathtt{athena\_xifu\_1469\_onaxis\_pitch249um\_v20160401.arf}$ and the RMF file $\mathtt{athena\_xifu\_rmf\_v20160401.rmf}$. This generated an event FITS file, which was then converted into a PHA file using $\mathtt{makespec}$. We produced a fit to this spectrum in $\mathtt{XSPEC}$, using the Levenberg-Marquardt fitting method to calculate the reduced $\chi^2$. Figure~\ref{spectrum} shows one simulation for ${g_{a \gamma \gamma} = 3 \times 10^{-13} {\rm GeV}^{-1}}$ and its fit to an absorbed power law.\n\n\n\nWe use the following procedure to determine whether a particular value of $g_{a \gamma \gamma}$ is excluded: we varied the ALP-photon coupling $g_{a \gamma \gamma}$ from $g_{a \gamma \gamma} = 5 \times 10^{-13} \, \text{GeV}^{-1}$ to $g_{a \gamma \gamma} = 1\times 10^{-13} \, \text{GeV}^{-1}$, with stepsize $0.5 \times 10^{-13} \, \text{GeV}^{-1}$. As the bound is dependent on uncertainties in the magnetic field strength of a factor of 2, and we are only using simulated data, we do not consider step sizes smaller than this. For each $g_{a \gamma \gamma}$:\n\begin{enumerate}\n\item Generate 50 configurations of the magnetic field $B_i$.\n\item Use the $B_i$ to calculate the survival probability $P_{\gamma \rightarrow \gamma}$ along the line of sight for different photon energies (as done in \cite{1312.3947}). We calculate for 8000 equally spaced photon energies in the range 0.01--10~keV.\n\item Combine each $P_{\gamma \rightarrow \gamma}$ with the AGN spectrum.\n\item Generate 10 fake PHAs for each spectrum, providing 500 fake data samples in total.\n\item Fit the fake data to Model 0, and calculate the reduced chi-squareds $\chi_1^2$.\n\item Generate 100 fake PHAs based on Model 0, and compute the average of their reduced chi-squareds $\chi_0^2$.\nAssuming the absence of ALPs, this represents the expected quality of the fit to the single real data set. If the actual data is a poor fit\nfor some reason, then this will weaken the level of the resulting bounds that we can produce.\n\item Determine the percentage of fake data sets that have a reduced chi-squared $\chi_1^2 < \rm{max}(\langle \chi_0^2 \rangle,1)$. If this is true for fewer than 5 per cent of the data sets, the value of $g_{a \gamma \gamma}$ is excluded at 95 per cent confidence.\n\end{enumerate}\n\nFor a simulation of 200~ks of data with the nominal mirror configuration, we derive a projected\nbound of ${g_{a\gamma\gamma} \lesssim 1.5 \times 10^{-13}~ \rm{GeV}^{-1}}$ at 95 per cent confidence and of ${g_{a\gamma\gamma} \lesssim 2.5 \times 10^{-13}~ \rm{GeV}^{-1}}$ at 99\% confidence, as shown in Fig.~\ref{fig:ExclusionLimit} alongside published data limits. This represents an order of magnitude improvement over the bound derived from the 200~ks of Chandra ACIS-I observations in \cite{Berg:2016ese}. We also find that even\na short 10~ks observation will lead to an improved bound of ${g_{a\gamma\gamma} \lesssim 4.5 \times 10^{-13}~ \rm{GeV}^{-1}}$.\n\nThese bounds are substantially better than any current experimental or astrophysical bound, and also go beyond the capabilities of IAXO for ultralight ALP masses. The proposed DM haloscope ABRACADABRA has the potential to explore $g_{a \gamma \gamma}$ down to $10^{-17} \text{GeV}^{-1}$ for $m_a \in [10^{-14},10^{-6}] \text{eV}$ \cite{Kahn:2016aff}, if ALPs constitute the Dark Matter. The existence of ALP-induced oscillations in galaxy clusters is independent of this. Proposed CMB experiments such as PIXIE \cite{Kogut:2011xw} and PRISM \cite{Andre:2013afa} could produce a constraint $g_{a \gamma \gamma} B < 10^{-16} \text{GeV}^{-1} \text{nG}$ which might be competitive with bounds from galaxy clusters if the cosmic magnetic field is close enough to saturation $\sim \text{nG}$ \cite{Tashiro:2013yea}. Black hole superradiance also offers tentative constraints ALPs on in the mass range $m_a \in [10^{-14},10^{-10}] \text{eV}$, depending on measurements of black hole spin \cite{Arvanitaki:2016qwi}.\n\n\n\n"
...,...
1150,sub
1151,"\n\label{sssec:numericalresults}\n\nIn this Section, we numerically analyse the parameters of the model so that the following requirements are satisfied: \n\begin{itemize}\n\item[a)] A successful model with around $60$ e-foldings of inflation that creates density perturbations of the correct size with\nall underlying parameters in their natural range;\n\n\item[b)] Low-energy gauginos which are well motivated by gauge coupling unification;\n\n\item[c)] A correct generation of the observed BAU, $n_\B/s \simeq 10^{-10}$, via the AD mechanism.\n\end{itemize}\n\nRequirement $a)$ has already been studied in Sec. \ref{ssec:KMI}. For concreteness, we consider the points in the parameter space listed in Tab. \ref{tab:tab1}. Scalar masses are completely determined by requirement $a)$ since, as we have shown in (\ref{sssec:scalarmasses}), they depend only on $W_0$ and ${V}$ once the string coupling constant has been fixed. On the contrary, requirement $b)$ can be easily fulfilled using the additional freedom of gaugino masses: the possibility to vary $\lambda(U,S)$ in (\ref{eq:gauginomasses}) by tuning background fluxes. In particular we require that $M = 5 \times 10^3 \, \rm GeV$ when $W_0 = 100$ and the value of the volume is the corresponding $\left.{V}\right|_{\scriptscriptstyle \rm COBE}$ in case $(C)$ of Tab. \ref{tab:tab1}. In order for requirement $c)$ to be fulfilled, it is necessary to find the exact value of the AD field displacement $\phi_0/M_p$ such that the baryon asymmetry estimated in (\ref{bau1}) matches the measured value. We focus on the split SUSY case where late-time scalars are non-tachyonic while the AD field during inflation becomes tachyonic. Moreover we assume that the A-terms are determined solely by the first term in (\ref{eq:atermsdilaton}). We stress that these choices do not affect the qualitative behaviour of our final results. \n\nIn Fig.~\ref{fig:plot1} we illustrate the correlation between the produced baryon asymmetry and the gaugino masses in the split SUSY case. For the sake of concreteness we choose to work in the dS$_1$ scenario but the results are not dramatically affected by changing the dS sector. Differently coloured bands in Fig.~\ref{fig:plot1} correspond to different ranges for the reheating temperature. The dotted black lines correspond to constant values of $W_0$ in the natural range: $1, 10, 100$ from left to right. The continuous blue line corresponds to the locus where the amplitude of the density perturbations matches the measured value. It intersects the dotted black lines in the blue dots which respectively correspond to the cases $(A), (B), (C)$ in Tab. \ref{tab:tab1}. In Tab.~\ref{tab:tab2} we report the values of scalar masses, which are around $10^{9-10}$ GeV, the reheating temperature, which is larger than $100$ GeV, and the displacement of the AD field. Notice that it is possible to satisfy the requirements $a)$, $b)$ and $c)$ for natural ${O}(1)$ values of the parameter $A_n$ and for $\phi_0 \sim 0.1\,M_p$. Moreover $T_{\rm rh}$ shown in Tab.~\ref{tab:tab2} and given in~(\ref{eq:treheatingmod}) is completely determined by the requirement of getting the right amplitude of density perturbations.\n\n\n\n\n\n\begin{table}[h!]\n\begin{center}\n\begin{tabular}{ccccc}\n\hline\n & $M \, [\rm{GeV}]$ & $m_0 \, [\rm{GeV}]$ & $T_{\rm rh} \, [\rm{GeV}]$ & $\phi_0/M_p$\\\n\hline\n$(A)$ & $5.4 \times 10^5$ & $3 \times 10^{10}$ & $6.7 \times 10^3$ & $0.03$ \\\n\hline\n$(B)$ & $5.2 \times 10^4$ & $9.2 \times 10^9$ & $1.1 \times 10^3$ & $0.08$ \\\n\hline\n$(C)$ & $5 \times 10^3$ & $2.8 \times 10^9$ & $195$ & $0.19$ \\\n\hline\n\end{tabular}\n\end{center}\n\caption{Gaugino masses $M$, scalar masses $m_0$, reheating temperature $T_{\rm rh}$ and displacement $\phi_0/M_p$ needed to match the measured amplitude of density perturbations for the cases listed in Tab.~\ref{tab:tab1}.}\n\label{tab:tab2}\n\end{table}\n\n\n"
1152,sub
1153,"\n\nIn order to determine whether the DM relic abundance has a thermal or non-thermal origin, we have to compare $T_{\rm rh}$ with the DM freeze-out temperature $T_{\rm f} \sim m_\DM/20$. If $T_{\rm rh} \, > \, T_{\rm f}$, the DM content is set by thermal freeze-out while, for $T_{\rm rh} \, < \, T_{\rm f}$, the DM abundance is produced non-thermally from the decay of the lightest modulus. Since the lowest reheating temperature that is compatible with successful inflation and baryogenesis is $T_{\rm rh} \, \simeq \, 195$ GeV, the non-thermal mechanism requires $m_\DM \, > \, 3.9$ TeV. Due to the gravity-mediated pattern of gaugino masses, the lightest gaugino is the Bino, and hence the DM candidate in our model is either a Bino- or a Higgsino-like neutralino. Binos typically have a small annihilation rate, $\langle \sigma_{\rm ann} v \rangle \, < \, 3 \times 10^{-26}$ cm$^3$ s$^{-1}$, especially for a split SUSY spectrum because of the extremely heavy sparticles. For Higgsinos with a mass above $\simeq 1.2$ TeV, we also have $\langle \sigma_{\rm ann} v \rangle \, < \, 3 \times 10^{-26}$ cm$^3$ s$^{-1}$.\n\nBecause of the smallness of the annihilation rate, non-thermal DM production must proceed through the `Branching' scenario where the correct relic abundance is produced directly from the decay of the lightest modulus~\cite{NonThDMinSeqLVS}. In this scenario, the DM abundance is given by:\n\begin{equation} \label{prodabun}\n\left({n_\DM \over s}\right)_{\rm non-th} = {3 T_{\rm rh} \over 4 m_\chi} ~ {\rm Br}_\DM \,,\n\end{equation}\nwhere ${\rm Br}_\DM$ is the branching ratio for producing $R$-parity odd particles (which eventually decay to the DM particle) from modulus decay. Even allowing for ${\rm Br}_\DM \sim 10^{-3}$, which is the smallest value allowed in this scenario~\cite{ADS}, and after using the values in Tab. \ref{tab:tab2}, we find that the `Branching' scenario would lead to DM overproduction by few orders of magnitude above the observed value: \n\begin{equation} \label{obsabun}\n\left({n_\DM \over s}\right)_{\rm obs} \simeq 5 \times 10^{-10} ~ \left({1 ~ {\rm GeV} \over m_\DM}\right)\,.\n\end{equation}\nThis implies that non-thermal DM is not compatible with inflation and baryogenesis in this model. We are therefore forced to consider thermal Higgsino DM with $m_\DM \simeq 1.2$ TeV where thermal freeze-out can produce the right DM abundance. For $m_\DM < 1.2$ TeV, the Higgsino is thermally underproduced, and so we need to consider mixed DM, as in the axion-Higgsino scenario~\cite{Howie}. \n\nRegarding the production of dark radiation, it has recently been shown \cite{Cicoli:2015bpq} that split SUSY models arising in sequestered string compactifications do not feature any overproduction. This is due to the large suppression of the excess of the effective neutrino number $\Delta N_{\rm eff}$ coming from the decay of $\chi$ into MSSM scalars, which is allowed in a vast region of the parameter space.\n\nFinally we would like to comment on obtaining a large VEV for the AD field and possible implications for the DM content of the universe. It is seen in Tab. \ref{tab:tab2} that the generation of the observed BAU needs $m_\phi \sim 10^9$-$10^{10}$ GeV and $\phi_0 \sim 0.1$ $M_p$. It is possible to get $\phi_0$ in this ballpark, see~(\ref{initial}), if the AD field is lifted by a non-renormalisable term of level $n = 9$ where $\lambda_9 \sim 1$.\footnote{In fact, all of the MSSM flat directions are lifted at this level if the superpotential includes all higher-order terms that are compatible with gauge symmetry~\cite{gkm}.} In this case, depending on the Higgsino mass, one can have either Higgsino or mixed DM scenario as mentioned above. \n\nOne may also obtain the required value of $\phi_0$ if the AD field is lifted by a renormalisable term with $n = 3$. However, in this case, a very small coupling $\lambda_3 \sim 10^{-8}-10^{-7}$ is needed. This is much smaller than all of the SM Yukawa couplings, but it may arise from renormalisable superpotential terms that violate $R$-parity (namely $LLE$, $UDD$, $QLD$ terms). Such terms destabilise the Higgsino, and a question is whether this can lead to a cosmologically consistent scenario. To answer this, let us consider the situation in the presence of the $LLE$ term. In this case, the Higgsino can decay to three leptons via an off-shell slepton. The decay rate is $\Gamma_{\tilde H} \sim (\lambda_3 y_l)^2 m^5_{\tilde H}/(8 \pi \cdot 32 \pi^2) m^4_{\tilde l}$, where $y_l$ is a leptonic Yukawa coupling, $m_{\tilde H}$ and $m_{\tilde l}$ denote the Higgsino and slepton masses respectively, and the factor of $32 \pi^2$ arises due to the three-body final state. For $\lambda_3 \sim 10^{-7}$, $y_l \sim 10^{-2}$, $m_{\tilde l} \sim 10^{10}$ GeV, and $m_{\tilde H} \lesssim 200$ GeV, we may find a decay lifetime $\tau_{\tilde H} \gtrsim 10^{27}$ sec. This is compatible with the tightest cosmological bounds on decaying DM from the cosmic microwave background~\cite{slatyer}. The DM content of the universe can be explained within a mixed scenario where the Higgsino is the sub-dominant component. \n\n"


In [13]:
def find_math_expressions(text):
    # Pattern to match LaTeX math environments and inline math
    patterns = [
        r'\$.*?\$',  # Inline math
        r'\\begin\{equation\}.*?\\end\{equation\}',  # Equation environment
        r'\\begin\{eqnarray\}.*?\\end\{eqnarray\}',  # Eqnarray environment
        r'\\begin\{align\}.*?\\end\{align\}',  # Align environment
        # Add more environments as needed
    ]
    combined_pattern = '|'.join(patterns)
    
    # Find all matches and return them
    return [(m.start(), m.end()) for m in re.finditer(combined_pattern, text, flags=re.DOTALL)]

In [14]:
def split_text_preserving_math(text, max_length=3000):
    math_expressions = find_math_expressions(text)
    chunks = []
    current_chunk = ""
    last_index = 0
    
    for start, end in math_expressions:
        # Add text before the math expression to the chunk
        current_chunk += text[last_index:start]
        # Check if current chunk exceeds max length
        if len(current_chunk) > max_length:
            chunks.append(current_chunk)
            current_chunk = ""
        # Add the math expression to the chunk
        current_chunk += text[start:end]
        last_index = end
    
    # Add remaining text after the last math expression
    remaining_text = text[last_index:]
    sentences = re.split(r'(?<=\.)\s', remaining_text)
    for sentence in sentences:
        if len(current_chunk) + len(sentence) > max_length and current_chunk:
            chunks.append(current_chunk)
            current_chunk = ""
        current_chunk += sentence + " "
    
    if current_chunk:
        chunks.append(current_chunk)
        
    return chunks

In [15]:
new_chunks = []
for text in df_chunks['chunk']:
    if len(text) > 3000:
        smaller_chunks = split_text_preserving_math(text)
        new_chunks.extend(smaller_chunks)
    else:
        new_chunks.append(text)

df_new_chunks = pd.DataFrame({'chunk': new_chunks})


In [16]:
df_new_chunks

Unnamed: 0,chunk
0,"\pdfoutput=1\n\documentclass[fleqn,usenatbib,useAMS]{mnras}\n\usepackage{newtxtext,newtxmath}\n\usepackage{amsmath,amssymb}\n\usepackage[T1]{fontenc}\n%\usepackage{ae,aecompl}\n\usepackage{natbib}\n\usepackage{epsfig}\n\usepackage{graphicx}\n\usepackage{tablefootnote}\n%\usepackage[export]{adjustbox}\n\usepackage{floatrow}\n\usepackage{caption}\n%\usepackage{hyperref}\n\n\newcommand{}{\mathcal}\n\n\title[Projected bounds on ALPs from ATHENA]{Projected bounds on ALPs from {\it Athena}}\n\author[J. P. Conlon et al.]{\nJoseph P. Conlon$^{1}$,\nFrancesca Day$^{1}$, \nNicholas Jennings$^{1}$\thanks{E-mail: nicholas.jennings@physics.ox.ac.uk}, \nSven Krippendorf$^{1}$\n\newauthor{ and Francesco Muia$^{1}$}\n\\\n% List of institutions\n$^{1}$Rudolf Peierls Centre for Theoretical Physics, 1 Keble Road, Oxford, OX1 3NP, UK\\\n}\n\date{\today}\n\n\pubyear{2017}\n\n\begin{document}\n\label{firstpage}\n\pagerange{\pageref{firstpage}--\pageref{lastpage}}\n\maketitle\n\n\begin{abstract}\nGalaxy clusters represent excellent laboratories to search for Axion-Like Particles (ALPs). They contain magnetic fields which can induce quasi-sinusoidal oscillations in the X-ray spectra of AGNs situated in or behind them. Due to its excellent \nenergy resolution, the X-ray Integral Field Unit (X-IFU) instrument onboard the {\it Athena} X-ray Observatory will be far more sensitive to ALP-induced modulations than current detectors. As a first analysis of the sensitivity of {\it Athena} to the ALP-photon coupling $g_{a \gamma \gamma}$, we simulate observations of the Seyfert galaxy NGC~1275 (hosting the radio source 3C~84) in the Perseus cluster using the SIXTE simulation software. We estimate that for a 200~ks exposure, a non-observation of spectral modulations will constrain ${g_{a\gamma\gamma}\lesssim1.5\times10^{-13}~\rm{GeV}^{-1}}$ for $m_a\lesssim10^{-12}~\rm{eV}$, representing an order of magnitude improvement over constraints derived using the current generation of satellites.\n\end{abstract}\n\n\begin{keywords}\nastroparticle physics -- elementary particles -- galaxies: clusters: individual: Perseus\n\end{keywords}\n\n"
1,"\n\label{introduction}\nX-ray astronomy provides a novel arena for fundamental physics. Thanks to exciting recent data, such as the observed excess at 3.5~keV \cite{Bulbul, Boyarsky}, there has been a renewed interest among particle physicists in the great promise of X-ray astronomy to shed light on physics beyond the Standard Model, including the existence of new particles.\n\nOne area for which X-ray astronomy is particularly suitable\n is in the search for Axion-Like Particles (ALPs).\nALPs are light pseudo-scalars that are a well motivated extension of the Standard Model \cite{PecceiQuinn,Wilczek,Weinberg} that arise\n generically in string compactifications, for example see \cite{hep-th/0602233,hep-th/0605206,1206.0819}. A general review of ALPs is \cite{RingwaldReview}. In the presence of a magnetic field $\langle B \rangle$ ALPs and photons interconvert \cite{Sikivie:1983ip, Raffelt:1987im}, and this induces quasi-sinusoidal oscillations at X-ray energies in the spectra of sources in and around galaxy clusters \cite{1304.0989, 1509.06748}.\n\nSearches for these oscillations can be used to constrain ALP parameter space.\nCurrent constraints on ALPs derived in this fashion \cite{1304.0989, Berg:2016ese, Marsh:2017yvc,Conlon:2017qcw} are based on data taken with CCD detectors, which have an energy resolution of $\mathcal{O}(100~\rm{eV})$. A large improvement with sensitivity will be achieved once data becomes available from microcalorimeters with $\mathcal{O}({\rm a~few} \, \rm{eV})$ energy resolution.\nSuch microcalorimeters will be on board the Advanced Telescope for High ENergy Astrophysics (ATHENA), currently scheduled to launch in 2028.\nIts X-IFU instrument will have both large effective area, good imaging and energy resolution of $\sim 2.5 \rm{eV}$, greatly enhancing the discovery potential for ALPs.\n\nIn this paper we provide a first estimate for the experimental sensitivity of {\it Athena} to ALPs. We do so using simulated data for a mock observation of NGC~1275, hosting the radio source 3C~84, which contains the central AGN of the Perseus cluster.\nThis object was chosen as we have previously used it to place bounds on ALPs using {\it Chandra} data \cite{Berg:2016ese}.\n\n"
2,"\n\label{alps}\nAn ALP $a$ couples to electromagnetism through the Lagrangian term:\n\begin{equation}\n\label{ALPphoton}\n\qquad L = \frac{1}{4 M}~a~F_{\mu \nu} \tilde{F}^{\mu \nu} = \frac{1}{M}~a~{\bf E} \cdot {\bf B}~,\n\end{equation}\nwhere ${M^{-1} = g_{a\gamma\gamma}}$ parametrises the strength of the interaction,\nand ${\bf E}$ and ${\bf B}$ are the electric and magnetic fields.\nAs their potential and interactions are protected by shift symmetries, ALPs can naturally have very small masses $m_a$. The probability of ALP-photon interaction in the presence of an external magnetic field $\langle B \rangle$ is a standard result \cite{Sikivie:1983ip, Raffelt:1987im}. \n\nThe full analytic expression for the probability of an ALP being converted to a photon after propagating through a single magnetic field domain of length $L$ is:\n\begin{equation}\n\qquad P_{a \rightarrow \gamma} = \frac{1}{2}\frac{\Theta^2}{1 + \Theta^2}\sin^2 \left( \Delta \sqrt{1 + \Theta^2} \right),\n\end{equation}\nwhere\n\begin{equation}\n\qquad \Theta = 0.28 \Bigg(\frac{B_{\perp}}{1 \mu\rm{G}}\Bigg)\Bigg(\frac{\omega}{1 \, \rm{keV}}\Bigg)\Bigg(\frac{10^{-3} \rm{cm}^{-3}}{n_e}\Bigg)\Bigg(\frac{10^{11} \rm{GeV}}{M}\Bigg),\n\end{equation}\n\begin{equation}\n\qquad \Delta = 0.54 \Bigg(\frac{n_e}{10^{-3} \rm{cm}^{-3}}\Bigg)\Bigg(\frac{L}{10 \, \rm{kpc}}\Bigg)\Bigg(\frac{1 \rm{keV}}{\omega}\Bigg).\n\end{equation}\nHere $B_{\perp}$ denotes the magnetic field component perpendicular to the ALP wave vector, $\omega$ is the energy and $n_e$ is the electron density. In the limit $\Delta, \Theta \ll 1$, $P \propto B^2 L^2 / M^2$. However when $\Theta < 1$ but $\Delta > 1$, then\n$ P \propto \Theta^2 \sin^2 \Delta$.\nThis probability grows with energy, containing oscillations that are rapid at low energies and broader at higher energies. These\noscillations leave a distinctive imprint on otherwise featureless spectra, and their absence allows us to constrain $g_{a\gamma\gamma}$.\n\nThis photon-ALP interconversion is particularly efficient in galaxy clusters (e.g. see ~\cite{0902.2320,1305.3603}).\nClusters have ${\bf B}$ fields of order $\sim \mu$G which extend over megaparsec scales, within which the magnetic field coherence lengths reach tens of kiloparsecs.\nThe relatively low electron densities ($\sim 10^{-3}\rm{cm}^{-3}$) also implies that it is at X-ray energies that the `sweet spot' of large\n $\Delta$, small $\Theta$, and quasi-sinusoidal energy-dependent $P_{\gamma \leftrightarrow a}$ is located ~\cite{1304.0989, 1305.3603, 1312.3947, 1509.06748}.\n\nThe 3D structure of intracluster magnetic fields is in general not known and so\nthe precise form of the survival probability along any single line of sight cannot be determined. Figure~\ref{fig:ALPPhotonConversion} illustrates the energy-dependent survival probability for a photon passing across three hundred domains of a magnetic field, with the direction of the magnetic\nfield randomised within each domain. The electron density and magnetic field strength in\nthe model are based on those applicable in the Perseus cluster, but the pattern of smaller, rapid oscillations at low energies and slow oscillations with greater amplitude at high energies is generic.\n\nActive Galactic Nuclei (AGNs) situated in or behind galaxy clusters provide excellent X-ray sources to search for such spectral modulations. One outstanding example is the bright central AGN of the Perseus cluster, at the heart of the galaxy NGC~1275.\nIts intrinsic spectrum is well described by an absorbed power law \cite{Churazov:2003hr,Yamazaki, Balmaverde2006, Fabian:2015kua}, and dominates the background cluster emission. The central cluster magnetic field value is estimated at"
3,"$ \sim 25 \mu$G by \cite{0602622}.\n\nAn analysis of archival data of observations of NGC~1275 by the {\it Chandra} and {\it XMM-Newton} satellites was done in \cite{Berg:2016ese}\n(see \cite{1603.06978} for a related analysis of NGC~1275 in gamma rays).\nExtending methods pioneered in \cite{1304.0989}, the constraint on the ALP-photon coupling ${g_{a\gamma\gamma} \lesssim 1.5 \times 10^{-12}~{\rm GeV}^{-1}}$ was found. For M87, a similar treatment was performed in \cite{Marsh:2017yvc}, finding a\nbound ${g_{a\gamma\gamma} \lesssim 1.5 \times 10^{-12}~{\rm GeV}^{-1}}$. An analysis of {\it Chandra} data of other bright point sources in galaxy clusters was conducted in (\cite{Conlon:2017qcw}), deriving bounds of ${g_{a\gamma\gamma} \lesssim 1.5 \times 10^{-12}~{\rm GeV}^{-1}}$ (for the Seyfert galaxy 2E~3140) and ${g_{a\gamma\gamma} \lesssim 2.4 \times 10^{-12}~{\rm GeV}^{-1}}$ (for the AGN NGC~3862).\n\n%%{\bf These bounds are superior to those derived from SN 1987A, and are similar to IAXO in this low mass region. The absence of CMB distortions %\cite{Mirizzi:2009aj, Tashiro:2013yea} \n%%constrain the product $g B < 10^{-13} \text{GeV}^{-1} \text{nG}$, which are competitive with bounds from galaxy clusters if the cosmic magnetic field saturates the observed bound < nG. This is complementary to DM haloscopes searches.}\n\nThese bounds all hold for light ALPs with masses $m_a \lesssim 10^{-12} {\rm eV}$. This implies that these methods are not sensitive\nto an ordinary QCD axion, which for a photon couplings $g_{a\gamma\gamma} \sim 10^{-12} {\rm GeV}^{-1}$ would typically have $m_a \sim 10^{-3} {\rm eV}$. However, unconventional models for the QCD axion where the photon coupling is significantly enhanced compared to naive expectation may\nbe constrained using these techniques.\n\nThe bounds produced are superior to the bound on light ALPs derived from SN 1987A of $g_{a \gamma \gamma} < 5 \times 10^{-12} \text{GeV}^{-1}$ \cite{Payez:2014xsa}, and are similar to those projected for IAXO in this low mass region \cite{Irastorza:2012qf}. The bounds are also superior to those inferred from the absence of CMB distortions in \mbox{COBE FIRAS} data \cite{Mirizzi:2009nq}, which constrain the product $g_{a \gamma \gamma} B < 10^{-11} \text{GeV}^{-1} \text{nG}$. Here $B$ is the strength of the cosmic magnetic field, which is limited to $B<\text{nG}$.\n\nOne major limiting constraint on existing data is the energy resolution of the detectors.\nIf they exist, ALPs provide oscillatory structure all the way down to the lowest energies.\nHowever, as illustrated in Figure~\ref{fig:ALPPhotonConversion}, detectors with energy resolutions of $\mathcal{O}(100~\rm{eV})$ cannot resolve this structure at lower energies -- but this does become accessible once a resolution of $\mathcal{O}(2.5~\rm{eV})$ is achieved. We now discuss the future {\it Athena} X-ray observatory, whose greatly enhanced technical capabilities offer improved sensitivity to ALP-photon interconversion. \n\n"
4,"}\n\label{athena}\nThe Advanced Telescope for High ENergy Astrophysics (ATHENA) is an ESA mission to explore the Hot and Energetic Universe, due to launch in 2028 \cite{Nandra:2013shg}. The mirror will have a $2~\rm{m}^2$ effective area and a 5~arcsec angular resolution. There are two instruments: the X-ray Integral Field Unit (X-IFU) and the Wide Field Imager (WFI). Here we focus on the former, which will consist of an array of TiAu Transition Edge Sensor (TES) micro-calorimeters sensitive to the energy range 0.2--12~keV \cite{Barret:2016ett}. When operated at a temperature of 50 mK, these can achieve an energy resolution of 2.5~eV below 7~keV \cite{Gottardi:2016cdx}, implying X-IFU will be able to resolve narrow spectral oscillations. A readout time of $\sim10~\mu\rm{s}$ will ensure pileup contamination is minimised. Table~\ref{satellites} contains\na summary of its properties, taken from the {\it Athena} Mission Proposal\footnote{http://www.the-athena-x-ray-observatory.eu/images/AthenaPapers/ \\ The\_Athena\_Mission\_Proposal.pdf}, compared to properties of the {\it Chandra} ACIS-I detector, taken from the {\it Chandra} Proposer's Guide\footnote{http://cxc.harvard.edu/proposer/POG/html/chap6.html}.\n\n\begin{table}\n\n\centering\n\begin{tabular}{r|c|c}\n& {\it Athena} (X-IFU) & {\it Chandra} (ACIS-I)\\\n%& (X-IFU) & (ACIS-I)\\\n\hline\hline\nEnergy range & 0.2--12 keV & 0.3--10 keV\\ \hline\nEnergy resolution & 2.5 eV & 150 eV\\ \n at 6 keV & & \\ \hline\nSpatial resolution & 5 arcsec & 0.5 arcsec\\ \hline\nTime resolution & 10~$\mu$s & 0.2 s\\\n& & (2.8~ms single row)\\ \hline\nEffective area & 2~m$^2$ @ 1 keV & 600~cm$^2$ @ 1.5 keV \\ \hline\n\end{tabular}\n\caption{Parameters taken from the {\it Athena} Mission Proposal and the {\it Chandra} Proposer's Guide.}\n\label{satellites}\n\end{table}\n\nThe combination of larger effective area, greatly improved energy resolution and reduced pileup contamination means {\it Athena} has far more potential to detect ALP-induced oscillations than the best current satellites. The aim of this paper is\nto make the first quantitative estimate of the extent to which {\it Athena} will be able to improve constraints on\n$g_{a\gamma\gamma}$.\n\n"
...,...
1977,"$(\mathcal{G}')^{-1}$ is the inverse function of $\mathcal{G}'$.\n\nSo far we have discussed how theories of axions with various potentials can be constructed in field theory. For our purposes we also want to consider axion theories that -- in Einstein frame -- exhibit a non-canonical kinetic term. As we had not included gravity in our discussions of axions yet, there was no need to consider non-canonical kinetic terms, as one could always normalize. However, we will return to the question of non-canonical kinetic terms in the next sections, when we consider axions in supergravity and string theory. \n\nWhile considering axions as inflatons helps overcome many UV problems of inflation in effective field theory, one cannot remain completely agnostic about UV physics. For example, natural inflation needs $f \gtrsim m_p$, which seems to be an unnatural feature in the context of quantum gravity~\cite{ArkaniHamed:2006dz, 0605206, Conlon:2012tz}. Hence, in the following we will describe how axions and their properties can arise when the UV physics is given by string theory. As string theory models of axion inflation are typically formulated in the effective supergravity theory arising from string theory compactifications, we turn to axions in supergravity next.\n\n\subsubsection*{Axions in supergravity}\nAxions can be very naturally embedded in supergravity. They can be described by either the phase or the real or imaginary parts of complex scalar fields in supermultiplets. Consider for example a theory of a chiral superfield $\Phi$ described by:\n\begin{equation}\n\mathcal{K} \equiv \mathcal{K}\left(\Phi + \overline{\Phi}\right)\,, \quad W \equiv W_0 = \textrm{const} \, .\n\end{equation}\nAs $\mathcal{K}$ only depends on the combination $(\Phi + \overline{\Phi})$ and $W$ is independent of $\Phi$, the theory is symmetric under continuous shifts of $\textrm{Im}(\Phi)$, which we identify with the axion: $\phi \equiv \textrm{Im}(\Phi)$. \n\nTo generate a potential for the axion, the shift symmetry has to be broken. This can occur due to non-perturbative effects as in the non-supersymmetric case. To this end we introduce a non-Abelian gauge sector with its corresponding field strength superfield $\mathcal{W}^{\alpha}$. If we choose the corresponding gauge kinetic function to be $f=\Phi$, the axion $\phi$ will couple to the topological term of the non-Abelian gauge theory:\n\begin{equation}\n\label{gaugekin}\n{\left. \left( \Phi \ \text{tr} \, \mathcal{W}_{\alpha} \mathcal{W}^{\alpha} + \textrm{h.c.} \right) \right|}_{F} \supset -\phi \ \text{tr} \, F_{\mu \nu} \tilde{F}^{\mu \nu} \, .\n\end{equation}\nThen non-perturbative effects will introduce a periodic (Einstein-frame) potential for $\phi$ while at the same time breaking the continuous shift symmetry down to a discrete one. \n\nIn this paper we are also interested in the coupling between the axion and the topological term of an Abelian gauge theory. This will arise from a coupling of type~\eqref{gaugekin} where $\mathcal{W}^{\alpha}$ is now the field strength superfield of the Abelian gauge theory. \n\nOne can generate more general (i.e.~non-peridiodic) potentials for"
1978,"$\phi$ if the chiral superfield $\Phi$ appears in the superpotential explicitly, e.g.~$W = m h (\Phi)$ where $h$ is a holomorphic function. Then the shift symmetry of the axion is broken explicitly by $W$ (see however~\cite{0811.1989, 1101.0026}) and one may generate a polynomial Einstein-frame potential $V_E$. As $\mathcal{K}$ is still shift-symmetric, some of the axionic protections are still active. In particular, the breaking of the shift-symmetry is completely controlled by the parameter $m$. This is the ansatz for inflation models realizing $F$-term axion monodromy inflation~\cite{1404.3040, 1404.3542, 1404.3711}.\n\nFor our purposes we are particularly interested in theories where the axion kinetic term depends non-trivially on the axion itself. Given a K\""ahler potential $\mathcal{K}$ the function $K(\phi)$ appearing in~\eqref{non_minimal:einstein_frame} is given by $K \equiv \partial_{\Phi} \partial_{\overline{\Phi}} \mathcal{K}$. We can then make the following observation. If $\mathcal{K}$ preserves the axionic shift-symmetry, it only depends on the combination $(~\Phi~+~\overline{\Phi}~)$ and the function $K$ will only depend on the saxion $\textrm{Re}(\Phi)$, but not on the axion $\phi = \textrm{Im}(\Phi)$. Hence it seems that in supergravity we cannot get any non-trivial axion-dependence in $K$, without breaking the axionic shift-symmetry in $\mathcal{K}$.\footnote{This finding holds for all axions, i.e.~also for axions arising as phases or the real parts of complex scalars in chiral superfields. As long as $\mathcal{K}$ does not depend on the axion as required by shift-symmetry, there cannot be any axion-dependence in $K$.} \n\nIt is possible to break the shift-symmetry in the K\""ahler potential in different ways. One possibility is to introduce an explicit breaking term as in~\cite{Ferrara:2010yw,Ferrara:2010in,Buchmuller:2012ex}. In such a case, in order not to lose all the advantages deriving from the shift-symmetry, the amount of breaking has to be small. In particular, we can always include further fields in the theory. Hence, a possibility is to break the shift-symmetry through loop effects, as for example for theories whose superpotential $W \supset \kappa \Phi S_+ S_-$~\cite{Gaillard:1993es,Stewart:1996ey,Stewart:1997wg}, where $S_\pm$ are heavy fields. Upon integrating out $S_{\pm}$, axion-dependent loop corrections modify the \Kahler potential. The amount of shift-symmetry breaking is naturally small because loop-suppressed. \n\nFurthermore, it is important to observe that in supergravity we can never get a theory of just an axion. As the axion arises from a complex scalar, there will at least always be the saxion partner as an additional field. If we consider effective supergravity theories from string theory, the existence of further fields is rather generic. Note that these generically introduce an explicit axion-dependence in the axion kinetic term through backreaction. \n\nFinally, note that in the Peccei-Quinn mechanism the axion arises from a phase of a complex field, whereas here we focused on axions corresponding to the imaginary part of a complex scalar:"
1979,"$\phi= \text{Im}(\Phi)$. However, both descriptions are related. If the real part of a complex scalar is a scalar, then calling the imaginary part or the phase a pseudoscalar is equivalent (in both cases, a complex conjugation corresponds to a change in sign in the pseudoscalar part). An explicit connection between the two cases can be made as follows. In particular, let\n\begin{equation}\nf= \Phi \equiv \sigma + i \phi \, ,\n\end{equation}\nwith $\phi$ an axion and $\sigma$ denoting the scalar component (saxion). Then we can define\n\begin{equation}\n\Phi_{\textrm{PQ}} = e^{f} = e^{i \phi} (\cosh \sigma + \sinh \sigma) \, ,\n\end{equation}\nsuch that the axion now appears as a phase.\nHence the descriptions of an axion as a phase vs.~the imaginary part are equivalent descriptions related by a non-linear map.\n\n\subsubsection*{Axions from String Theory and Quantum Gravity Constraints}\n\nAxions are also a very natural prediction of string theory. They arise from the dimensional reduction of form field gauge potentials on sub-manifolds of the string theory compactification space. The shift-symmetry in the four-dimensional effective field theory is a remnant of the gauge symmetry of gauge fields in the ten-dimensional theory. In addition there are also universal axions (the axionic part of the axio-dilaton and the axions from dualizing to 2-form gauge potentials (see e.g.~\cite{1404.2601} for a brief review). It is even expected that string theory compactifications may give rise to a \textit{string axiverse}~\cite{Arvanitaki:2009fg, Cicoli:2012sz}. \n\nThere has been a sustained effort in the string theory community to embed inflation in string theory. Due to issues of theoretical control, models of inflation are typically constructed in a regime where an effective field theory description is applicable, rather than working in string theory directly. In particular, models are typically realized in the effective supergravity theory. There exists a multitude of proposed models of inflation in string theory (for a review until 2014 see~\cite{1404.2601}, for subsequent progress and references until September 2014 see~\cite{1409.5350}). However, most models come with open questions regarding control of quantum corrections, such that it is difficult to make robust predictions.\n\nHowever, there are certain properties which appear to be universal as far as embedding axion inflation in string theory is concerned. In particular, axions with a super-Planckian period ($f > m_p$) seem to be inconsistent with string theory compactifications~\cite{0605206}. This implies that the simplest models of natural inflation cannot arise from string theory. This is also consistent with general quantum gravity arguments~\cite{ArkaniHamed:2006dz, Conlon:2012tz}.\n\nThis does not imply that axion inflation in general is forbidden in string theory. However, to evade the constraints on the axion field range, models have to become more involved. The following mechanisms have been proposed to allow for inflation despite the constraint on the axion period:\n\begin{itemize}\n\item \textit{Alignment mechanisms}~\cite{Kim:2004rp}. The idea is to create a long super-Planckian inflaton trajectory in the field space of two or more sub-Planckian axions. It is necessary to tune the potential~\cite{Kim:2004rp} or to rely on kinetic terms~\cite{1404.7496, Shiu:2015xda} to create this long trajectory within a compact sub-Planckian field space. \n\item \textit{N-flation}~\cite{Dimopoulos:2005ac, Cicoli:2014sva, Das:2014gua}: This approach exploits the fact that a diagonal direction in the field space of"
1980,"$N$ axions can be super-Planckian for sufficiently large $N$, even if every single axion has a sub-Planckian field range.\n\item \textit{Axion monodromy}~\cite{Silverstein:2008sg, 0808.0706}: These models make use of an explicit breaking of the shift-symmetry (e.g.~due the presence of branes) in the spirit of~\cite{0507215, 0811.1989, 1101.0026} to generate a perturbative non-periodic potential for the axion. The originally periodic axion field space is effectively unfolded. \n\end{itemize}\nString theory compactifications contain all necessary `ingredients' for a successful embedding of any one of the above approaches: the existence of multiple axions is rather generic and D-branes and fluxes give rise to monodromies. Consequently, there exist many proposed models based on these ideas (see e.g.\cite{1409.5350} for a review until Sep.~2014). Yet, there are many open questions regarding the viability of any one model of axion inflation from string theory. Generalizations of the Weak Gravity Conjecture pose serious constraints on models based on alignment or N-flation~\cite{1503.00795, 1506.03447}. At the same time there are persistent problems with control as far as the stabilization of additional scalar fields (moduli) is concerned. Overall, at the time of writing there is no final verdict regarding axion inflation from string theory: While string theory exhibits many properties for successful axion inflation, there does not yet exist a model that withstands deeper scrutiny.\footnote{Models of axion inflation are typically models of large-field inflation which will give rise to measurable tensor modes. However, measurable tensor modes can also be generated in stringy inflation models that do not employ axions~\cite{Cicoli:2008gp, Burgess:2016owb, Cicoli:2016chb}. For such inflationary models explicit string theory embeddings have been built, including a controlled moduli stabilization procedure and the presence of a chiral visible sector~\cite{Cicoli:2016xae, ChiralGlobalFibre}.}\n\nWhat does this imply for the models of axion inflation considered in this work? In this paper we explore models that -- in Einstein frame -- exhibit a range of axion potentials, but also have non-canonical kinetic terms for the axion that depend on the axion itself. In addition, the axion should couple to the topological term associated with Abelian gauge theories. Overall, we find that string theory exhibits all the properties to accommodate the axion inflation models discussed in this work -- at least in principle. \n\begin{itemize}\n\item As far as the potential is concerned, models of axion inflation in string theory were shown to give rise to a wide range of possible potentials. The possibilities increase further once back-reaction of other scalar fields (moduli) is taken into account~\cite{1011.4521,1405.3652}. \n\item As the existence of moduli is a generic feature of string theory compactifications, back-reaction effects will typically play a role. As described in the section on supergravity, back-reaction effects can also induce axion-dependence of the kinetic terms. \n\item Furthermore, couplings between axions and the topological terms of (non-)Abelian gauge theories is generic in string theory. These couplings are a crucial ingredient for the cancellation of gauge anomalies in consistent string vacuums via the generalized Green-Schwarz mechanism.\footnote{In this case the gauge bosons receive string scale masses.} Interestingly, couplings of the form"


In [17]:
# Assume df_new_chunks is your DataFrame containing the chunks to translate
chunks_test = df_new_chunks['chunk'].head(10).tolist()  # Take the first 10 chunks for this example

chunk_responses = []

In [21]:
user_prompt_template = """
    Translate the following LaTeX content into plain text, adhering to these rules:
    - Convert \\section, \\subsection, \\abstract, \\chapter, etc., commands into plain text headings like Section, Subsection, Abstract, etc.
    - Keep mathematical equations as in LaTeX, enclosed in $ ... $, \\begin{{equation}} ... \\end{{equation}}, etc.
    - Turn \\begin{{itemize}} ... \\end{{itemize}}, \\begin{{enumerate}} ... \\end{{enumerate}} into bullet/numbered lists.
    - Enclose citations like \\cite{{cited_paper}} in square brackets: [cited_paper].
    - Remove all LaTeX commands that do not add information to the plain text.
    - If a chunk does not return meaningful plain text or equations, keep the output empty.

    LaTeX content to translate:
    {{chunk}}
"""

In [29]:
# Assuming `chunks_test` is your list of LaTeX chunks
for chunk in chunks_test:
    # Constructing messages as a list of dictionaries
    messages = [
        {"role": "system", "content": user_prompt_template},
        {"role": "user", "content": chunk}
    ]
    
    try:
        response = client.chat.completions.create(
            model="gpt-3.5-turbo-0125",
            messages=messages
            #temperature=0.5,
            #max_tokens=1024
        )

        # Correctly accessing the translated text from the response
        translated_text = response.choices[-1].message.content if response.choices else "No response"

        # Appending the LaTeX chunk and its translated text to the list
        chunk_responses.append({
            "LaTeX Code": chunk,
            "Translated Text": translated_text
        })
    except Exception as e:
        print(f"An error occurred: {e}")
        chunk_responses.append({
            "LaTeX Code": chunk,
            "Translated Text": "Error processing this chunk"
        })


In [34]:
chunk_responses

[{'LaTeX Code': '\\pdfoutput=1\n\\documentclass[fleqn,usenatbib,useAMS]{mnras}\n\\usepackage{newtxtext,newtxmath}\n\\usepackage{amsmath,amssymb}\n\\usepackage[T1]{fontenc}\n%\\usepackage{ae,aecompl}\n\\usepackage{natbib}\n\\usepackage{epsfig}\n\\usepackage{graphicx}\n\\usepackage{tablefootnote}\n%\\usepackage[export]{adjustbox}\n\\usepackage{floatrow}\n\\usepackage{caption}\n%\\usepackage{hyperref}\n\n\\newcommand{}{\\mathcal}\n\n\\title[Projected bounds on ALPs from ATHENA]{Projected bounds on ALPs from {\\it Athena}}\n\\author[J. P. Conlon et al.]{\nJoseph P. Conlon$^{1}$,\nFrancesca Day$^{1}$, \nNicholas Jennings$^{1}$\\thanks{E-mail: nicholas.jennings@physics.ox.ac.uk}, \nSven Krippendorf$^{1}$\n\\newauthor{ and Francesco Muia$^{1}$}\n\\\\\n% List of institutions\n$^{1}$Rudolf Peierls Centre for Theoretical Physics, 1 Keble Road, Oxford, OX1 3NP, UK\\\\\n}\n\\date{\\today}\n\n\\pubyear{2017}\n\n\\begin{document}\n\\label{firstpage}\n\\pagerange{\\pageref{firstpage}--\\pageref{lastp

In [33]:
# Creating a DataFrame from the responses
df_translations = pd.DataFrame(chunk_responses)
display(df_translations)

Unnamed: 0,LaTeX Code,Translated Text
0,"\pdfoutput=1\n\documentclass[fleqn,usenatbib,useAMS]{mnras}\n\usepackage{newtxtext,newtxmath}\n\usepackage{amsmath,amssymb}\n\usepackage[T1]{fontenc}\n%\usepackage{ae,aecompl}\n\usepackage{natbib}\n\usepackage{epsfig}\n\usepackage{graphicx}\n\usepackage{tablefootnote}\n%\usepackage[export]{adjustbox}\n\usepackage{floatrow}\n\usepackage{caption}\n%\usepackage{hyperref}\n\n\newcommand{}{\mathcal}\n\n\title[Projected bounds on ALPs from ATHENA]{Projected bounds on ALPs from {\it Athena}}\n\author[J. P. Conlon et al.]{\nJoseph P. Conlon$^{1}$,\nFrancesca Day$^{1}$, \nNicholas Jennings$^{1}$\thanks{E-mail: nicholas.jennings@physics.ox.ac.uk}, \nSven Krippendorf$^{1}$\n\newauthor{ and Francesco Muia$^{1}$}\n\\\n% List of institutions\n$^{1}$Rudolf Peierls Centre for Theoretical Physics, 1 Keble Road, Oxford, OX1 3NP, UK\\\n}\n\date{\today}\n\n\pubyear{2017}\n\n\begin{document}\n\label{firstpage}\n\pagerange{\pageref{firstpage}--\pageref{lastpage}}\n\maketitle\n\n\begin{abstract}\nGalaxy clusters represent excellent laboratories to search for Axion-Like Particles (ALPs). They contain magnetic fields which can induce quasi-sinusoidal oscillations in the X-ray spectra of AGNs situated in or behind them. Due to its excellent \nenergy resolution, the X-ray Integral Field Unit (X-IFU) instrument onboard the {\it Athena} X-ray Observatory will be far more sensitive to ALP-induced modulations than current detectors. As a first analysis of the sensitivity of {\it Athena} to the ALP-photon coupling $g_{a \gamma \gamma}$, we simulate observations of the Seyfert galaxy NGC~1275 (hosting the radio source 3C~84) in the Perseus cluster using the SIXTE simulation software. We estimate that for a 200~ks exposure, a non-observation of spectral modulations will constrain ${g_{a\gamma\gamma}\lesssim1.5\times10^{-13}~\rm{GeV}^{-1}}$ for $m_a\lesssim10^{-12}~\rm{eV}$, representing an order of magnitude improvement over constraints derived using the current generation of satellites.\n\end{abstract}\n\n\begin{keywords}\nastroparticle physics -- elementary particles -- galaxies: clusters: individual: Perseus\n\end{keywords}\n\n",Error processing this chunk
1,"\n\label{introduction}\nX-ray astronomy provides a novel arena for fundamental physics. Thanks to exciting recent data, such as the observed excess at 3.5~keV \cite{Bulbul, Boyarsky}, there has been a renewed interest among particle physicists in the great promise of X-ray astronomy to shed light on physics beyond the Standard Model, including the existence of new particles.\n\nOne area for which X-ray astronomy is particularly suitable\n is in the search for Axion-Like Particles (ALPs).\nALPs are light pseudo-scalars that are a well motivated extension of the Standard Model \cite{PecceiQuinn,Wilczek,Weinberg} that arise\n generically in string compactifications, for example see \cite{hep-th/0602233,hep-th/0605206,1206.0819}. A general review of ALPs is \cite{RingwaldReview}. In the presence of a magnetic field $\langle B \rangle$ ALPs and photons interconvert \cite{Sikivie:1983ip, Raffelt:1987im}, and this induces quasi-sinusoidal oscillations at X-ray energies in the spectra of sources in and around galaxy clusters \cite{1304.0989, 1509.06748}.\n\nSearches for these oscillations can be used to constrain ALP parameter space.\nCurrent constraints on ALPs derived in this fashion \cite{1304.0989, Berg:2016ese, Marsh:2017yvc,Conlon:2017qcw} are based on data taken with CCD detectors, which have an energy resolution of $\mathcal{O}(100~\rm{eV})$. A large improvement with sensitivity will be achieved once data becomes available from microcalorimeters with $\mathcal{O}({\rm a~few} \, \rm{eV})$ energy resolution.\nSuch microcalorimeters will be on board the Advanced Telescope for High ENergy Astrophysics (ATHENA), currently scheduled to launch in 2028.\nIts X-IFU instrument will have both large effective area, good imaging and energy resolution of $\sim 2.5 \rm{eV}$, greatly enhancing the discovery potential for ALPs.\n\nIn this paper we provide a first estimate for the experimental sensitivity of {\it Athena} to ALPs. We do so using simulated data for a mock observation of NGC~1275, hosting the radio source 3C~84, which contains the central AGN of the Perseus cluster.\nThis object was chosen as we have previously used it to place bounds on ALPs using {\it Chandra} data \cite{Berg:2016ese}.\n\n",Error processing this chunk
2,"\n\label{alps}\nAn ALP $a$ couples to electromagnetism through the Lagrangian term:\n\begin{equation}\n\label{ALPphoton}\n\qquad L = \frac{1}{4 M}~a~F_{\mu \nu} \tilde{F}^{\mu \nu} = \frac{1}{M}~a~{\bf E} \cdot {\bf B}~,\n\end{equation}\nwhere ${M^{-1} = g_{a\gamma\gamma}}$ parametrises the strength of the interaction,\nand ${\bf E}$ and ${\bf B}$ are the electric and magnetic fields.\nAs their potential and interactions are protected by shift symmetries, ALPs can naturally have very small masses $m_a$. The probability of ALP-photon interaction in the presence of an external magnetic field $\langle B \rangle$ is a standard result \cite{Sikivie:1983ip, Raffelt:1987im}. \n\nThe full analytic expression for the probability of an ALP being converted to a photon after propagating through a single magnetic field domain of length $L$ is:\n\begin{equation}\n\qquad P_{a \rightarrow \gamma} = \frac{1}{2}\frac{\Theta^2}{1 + \Theta^2}\sin^2 \left( \Delta \sqrt{1 + \Theta^2} \right),\n\end{equation}\nwhere\n\begin{equation}\n\qquad \Theta = 0.28 \Bigg(\frac{B_{\perp}}{1 \mu\rm{G}}\Bigg)\Bigg(\frac{\omega}{1 \, \rm{keV}}\Bigg)\Bigg(\frac{10^{-3} \rm{cm}^{-3}}{n_e}\Bigg)\Bigg(\frac{10^{11} \rm{GeV}}{M}\Bigg),\n\end{equation}\n\begin{equation}\n\qquad \Delta = 0.54 \Bigg(\frac{n_e}{10^{-3} \rm{cm}^{-3}}\Bigg)\Bigg(\frac{L}{10 \, \rm{kpc}}\Bigg)\Bigg(\frac{1 \rm{keV}}{\omega}\Bigg).\n\end{equation}\nHere $B_{\perp}$ denotes the magnetic field component perpendicular to the ALP wave vector, $\omega$ is the energy and $n_e$ is the electron density. In the limit $\Delta, \Theta \ll 1$, $P \propto B^2 L^2 / M^2$. However when $\Theta < 1$ but $\Delta > 1$, then\n$ P \propto \Theta^2 \sin^2 \Delta$.\nThis probability grows with energy, containing oscillations that are rapid at low energies and broader at higher energies. These\noscillations leave a distinctive imprint on otherwise featureless spectra, and their absence allows us to constrain $g_{a\gamma\gamma}$.\n\nThis photon-ALP interconversion is particularly efficient in galaxy clusters (e.g. see ~\cite{0902.2320,1305.3603}).\nClusters have ${\bf B}$ fields of order $\sim \mu$G which extend over megaparsec scales, within which the magnetic field coherence lengths reach tens of kiloparsecs.\nThe relatively low electron densities ($\sim 10^{-3}\rm{cm}^{-3}$) also implies that it is at X-ray energies that the `sweet spot' of large\n $\Delta$, small $\Theta$, and quasi-sinusoidal energy-dependent $P_{\gamma \leftrightarrow a}$ is located ~\cite{1304.0989, 1305.3603, 1312.3947, 1509.06748}.\n\nThe 3D structure of intracluster magnetic fields is in general not known and so\nthe precise form of the survival probability along any single line of sight cannot be determined. Figure~\ref{fig:ALPPhotonConversion} illustrates the energy-dependent survival probability for a photon passing across three hundred domains of a magnetic field, with the direction of the magnetic\nfield randomised within each domain. The electron density and magnetic field strength in\nthe model are based on those applicable in the Perseus cluster, but the pattern of smaller, rapid oscillations at low energies and slow oscillations with greater amplitude at high energies is generic.\n\nActive Galactic Nuclei (AGNs) situated in or behind galaxy clusters provide excellent X-ray sources to search for such spectral modulations. One outstanding example is the bright central AGN of the Perseus cluster, at the heart of the galaxy NGC~1275.\nIts intrinsic spectrum is well described by an absorbed power law \cite{Churazov:2003hr,Yamazaki, Balmaverde2006, Fabian:2015kua}, and dominates the background cluster emission. The central cluster magnetic field value is estimated at",Error processing this chunk
3,"$ \sim 25 \mu$G by \cite{0602622}.\n\nAn analysis of archival data of observations of NGC~1275 by the {\it Chandra} and {\it XMM-Newton} satellites was done in \cite{Berg:2016ese}\n(see \cite{1603.06978} for a related analysis of NGC~1275 in gamma rays).\nExtending methods pioneered in \cite{1304.0989}, the constraint on the ALP-photon coupling ${g_{a\gamma\gamma} \lesssim 1.5 \times 10^{-12}~{\rm GeV}^{-1}}$ was found. For M87, a similar treatment was performed in \cite{Marsh:2017yvc}, finding a\nbound ${g_{a\gamma\gamma} \lesssim 1.5 \times 10^{-12}~{\rm GeV}^{-1}}$. An analysis of {\it Chandra} data of other bright point sources in galaxy clusters was conducted in (\cite{Conlon:2017qcw}), deriving bounds of ${g_{a\gamma\gamma} \lesssim 1.5 \times 10^{-12}~{\rm GeV}^{-1}}$ (for the Seyfert galaxy 2E~3140) and ${g_{a\gamma\gamma} \lesssim 2.4 \times 10^{-12}~{\rm GeV}^{-1}}$ (for the AGN NGC~3862).\n\n%%{\bf These bounds are superior to those derived from SN 1987A, and are similar to IAXO in this low mass region. The absence of CMB distortions %\cite{Mirizzi:2009aj, Tashiro:2013yea} \n%%constrain the product $g B < 10^{-13} \text{GeV}^{-1} \text{nG}$, which are competitive with bounds from galaxy clusters if the cosmic magnetic field saturates the observed bound < nG. This is complementary to DM haloscopes searches.}\n\nThese bounds all hold for light ALPs with masses $m_a \lesssim 10^{-12} {\rm eV}$. This implies that these methods are not sensitive\nto an ordinary QCD axion, which for a photon couplings $g_{a\gamma\gamma} \sim 10^{-12} {\rm GeV}^{-1}$ would typically have $m_a \sim 10^{-3} {\rm eV}$. However, unconventional models for the QCD axion where the photon coupling is significantly enhanced compared to naive expectation may\nbe constrained using these techniques.\n\nThe bounds produced are superior to the bound on light ALPs derived from SN 1987A of $g_{a \gamma \gamma} < 5 \times 10^{-12} \text{GeV}^{-1}$ \cite{Payez:2014xsa}, and are similar to those projected for IAXO in this low mass region \cite{Irastorza:2012qf}. The bounds are also superior to those inferred from the absence of CMB distortions in \mbox{COBE FIRAS} data \cite{Mirizzi:2009nq}, which constrain the product $g_{a \gamma \gamma} B < 10^{-11} \text{GeV}^{-1} \text{nG}$. Here $B$ is the strength of the cosmic magnetic field, which is limited to $B<\text{nG}$.\n\nOne major limiting constraint on existing data is the energy resolution of the detectors.\nIf they exist, ALPs provide oscillatory structure all the way down to the lowest energies.\nHowever, as illustrated in Figure~\ref{fig:ALPPhotonConversion}, detectors with energy resolutions of $\mathcal{O}(100~\rm{eV})$ cannot resolve this structure at lower energies -- but this does become accessible once a resolution of $\mathcal{O}(2.5~\rm{eV})$ is achieved. We now discuss the future {\it Athena} X-ray observatory, whose greatly enhanced technical capabilities offer improved sensitivity to ALP-photon interconversion. \n\n",Error processing this chunk
4,"}\n\label{athena}\nThe Advanced Telescope for High ENergy Astrophysics (ATHENA) is an ESA mission to explore the Hot and Energetic Universe, due to launch in 2028 \cite{Nandra:2013shg}. The mirror will have a $2~\rm{m}^2$ effective area and a 5~arcsec angular resolution. There are two instruments: the X-ray Integral Field Unit (X-IFU) and the Wide Field Imager (WFI). Here we focus on the former, which will consist of an array of TiAu Transition Edge Sensor (TES) micro-calorimeters sensitive to the energy range 0.2--12~keV \cite{Barret:2016ett}. When operated at a temperature of 50 mK, these can achieve an energy resolution of 2.5~eV below 7~keV \cite{Gottardi:2016cdx}, implying X-IFU will be able to resolve narrow spectral oscillations. A readout time of $\sim10~\mu\rm{s}$ will ensure pileup contamination is minimised. Table~\ref{satellites} contains\na summary of its properties, taken from the {\it Athena} Mission Proposal\footnote{http://www.the-athena-x-ray-observatory.eu/images/AthenaPapers/ \\ The\_Athena\_Mission\_Proposal.pdf}, compared to properties of the {\it Chandra} ACIS-I detector, taken from the {\it Chandra} Proposer's Guide\footnote{http://cxc.harvard.edu/proposer/POG/html/chap6.html}.\n\n\begin{table}\n\n\centering\n\begin{tabular}{r|c|c}\n& {\it Athena} (X-IFU) & {\it Chandra} (ACIS-I)\\\n%& (X-IFU) & (ACIS-I)\\\n\hline\hline\nEnergy range & 0.2--12 keV & 0.3--10 keV\\ \hline\nEnergy resolution & 2.5 eV & 150 eV\\ \n at 6 keV & & \\ \hline\nSpatial resolution & 5 arcsec & 0.5 arcsec\\ \hline\nTime resolution & 10~$\mu$s & 0.2 s\\\n& & (2.8~ms single row)\\ \hline\nEffective area & 2~m$^2$ @ 1 keV & 600~cm$^2$ @ 1.5 keV \\ \hline\n\end{tabular}\n\caption{Parameters taken from the {\it Athena} Mission Proposal and the {\it Chandra} Proposer's Guide.}\n\label{satellites}\n\end{table}\n\nThe combination of larger effective area, greatly improved energy resolution and reduced pileup contamination means {\it Athena} has far more potential to detect ALP-induced oscillations than the best current satellites. The aim of this paper is\nto make the first quantitative estimate of the extent to which {\it Athena} will be able to improve constraints on\n$g_{a\gamma\gamma}$.\n\n",Error processing this chunk
5,"\n\label{bounds}\nIn terms of estimating bounds on $g_{a\gamma\gamma}$ we use the same method as previously applied with\n{\it Chandra} data \cite{Berg:2016ese}. This allows for a direct comparison\nbetween the capabilities of {\it Chandra} and {\it Athena} in terms of placing bounds.\n\nWe simulate {\it Athena} observations of NGC~1275, using two models for the photon spectra of the AGN.\nThe first is a standard spectrum without ALPs, and the second is a model with the same spectrum multiplied with the\nphoton survival probability distribution as introduced in Section~\ref{alps}. Using simulations of the\nX-IFU detector response, we fit spectra generated assuming ALP-photon conversion with the model without ALPs (Model 0) and then we compare this fit to the fit of the spectrum generated without ALPs to the same model.\nTo allow for the uncertainty in the\nmagnetic field configuration along the line of sight, we repeat this analysis using many different randomly generated magnetic fields.\n\nThe two photon spectra that we model are:\n\begin{enumerate}\n\item Model 0: An absorbed power law plus thermal background:\n\begin{equation}\n\qquad F_{0}(E) = (A E^ {- \gamma} + \mathtt{BAPEC}) \times e^{-n_{H} \sigma(E,z)},\n\end{equation}\nwhere $A$ and $\gamma$ are the amplitude and index of the power law, $E$ is the energy, $n_H$ is the equivalent hydrogen column, $\sigma(E, z)$ is the photo-electric cross-section at redshift $z$, and $\mathtt{BAPEC}$ is the standard plasma thermal emission model.\n\item Model 1: An absorbed power law plus thermal background, multiplied by a table of survival probabilities for photons of different energies:\n\begin{equation}\nF_{1}(E, {\bf B}) = (A E^ {- \gamma} + \mathtt{BAPEC}) \times e^{-n_{H} \sigma(E,z)} \times P_{\gamma \to \gamma} (E (1 + z), { \bf B}, g_{a \gamma \gamma})~.\n\end{equation}\n\end{enumerate}\nThe index of the power law was set based on the best fit value from the cleanest {\it Chandra} observations of NGC~1275, and its normalisation was determined based on the {\it Hitomi} 230~ks observation of Perseus in 2016 \cite{Aharonian:2016gzq}. As the AGN in 2016 was\nroughly twice as bright as in 2009 and it has previously exhibited large historical variation \cite{Fabian:2015kua}, it may be again much brighter (or dimmer) in 2028, which would affect both the contrast\nagainst the cluster background and also the observation time required to achieve a certain constraint on $g_{a \gamma \gamma}$.\n\nThe 2016 {\it Hitomi} observation also constrained the temperature, abundances and velocity dispersion of the cluster thermal emission to a high degree of accuracy \cite{Aharonian:2016gzq}.\nFor the spectral shape of the cluster background, we used the single-temperature $\mathtt{bapec}$ model that was a good fit\nto the {\it Hitomi} spectrum across its field of view. While this single-temperature model is unlikely to be a good fit for the background\ncontiguous to the AGN, it represents a useful proxy for the actual background that can only be determined at the time.\nThe normalisation of the background was set by extracting a circular region\nof the cluster emission close to the AGN from the {\it Chandra} observations, of radius equal to the angular resolution of {\it Athena}, and determining the best fit. All model parameters are shown in Table \ref{parameters}.\n\begin{table}\n\centering\n\begin{tabular}{l|l|c|c}\nModel & parameter & symbol & value\\ \hline \hline\n",Error processing this chunk
6,"$\mathtt{zwabs}$ & nH column density & $n_H$ & $0.24 \times 10^{22} \rm{cm}^{-2}$\\\n & redshift & z & 0.0176\\ \hline\n$\mathtt{powerlaw}$ & index & $\gamma$ & 1.8\\\n & normalisation & A & $9 \times 10^{-3}$\\ \hline\n$\mathtt{bapec}$ & temperature & kT & 3.48 keV\\\n & abundances & & 0.54 solar\\\n & velocity dispersion & v & 178 m \,${\rm s}^{-1}$\\\n& normalisation & N & $9 \times 10^{-4}$\n\end{tabular}\n\caption{Parameters of the absorbed power law describing the spectrum of NGC~1275, and the thermal model of the cluster background.}\n\label{parameters}\n\end{table}\n\nAs for the study with {\it Chandra}, we take the central magnetic field value as $B_0\sim 25\mu $G, following \cite{0602622}. We also\nassume that $B$ decreases with radius as $B \propto n_{e}^{0.7}$.\nAs there is not a direct measurement of the power spectrum and coherence length for the Perseus magnetic field, we base the model on those inferred for the cool core cluster A2199 \cite{Vacca:2012up}.\n\nThe electron density $n_{e}$ has the radial distribution found in \cite{Churazov:2003hr}:\n\begin{equation}\n\qquad n_{e} (r) = \frac{3.9 \times 10^{-2}}{ [ 1 + (\frac{r}{80 \, {\rm kpc}})^2]^{1.8}} + \frac{4.05 \times 10^{-3}}{ [ 1 + (\frac{r}{280 \, {\rm kpc}})^2]^{0.87}} \, {\rm cm}^{-3}.\n\end{equation}\n\nThe magnetic field is generated over 300 domains, whose lengths are drawn from a Pareto distribution between $3.5~\rm{kpc}$ and $10~\rm{kpc}$ with power 2.8. In each domain the magnetic field and electron density are constant, with a random direction of ${\bf B}$. We then\ncalculate the survival probability of a photon passing through this region, as described in \cite{1312.3947}.\n\nThe simulations were performed using the Simulation of X-ray Telescopes ($\mathtt{SIXTE}$) code, a multi-instrument simulation package. It aims to offer an end-to-end simulation, i.e. the full detector chain from the source to the final data. It models the telescope's vignetting, ARF and PSF, and X-IFU's response, event reconstruction and pileup \cite{2014SPIE.9144E..5XW}.\n\nThe spectrum of NGC~1275, and the cluster background, were modelled in $\mathtt{XSPEC}$\footnote{https://heasarc.gsfc.nasa.gov/xanadu/xspec/manual/manual.html} as an absorbed power law plus a thermal component, $\mathtt{zwabs*(powerlaw + bapec)}$. This spectrum, either multiplied with the photon survival probabilities or not, was converted to the SIMPUT\footnote{http://hea-www.harvard.edu/heasarc/formats/simput-1.0.0.pdf} file format using the command $\mathtt{simputfile}$. The mirror and detector response were modelled with $\mathtt{xifupipeline}$, using the ARF file $\mathtt{athena\_xifu\_1469\_onaxis\_pitch249um\_v20160401.arf}$ and the RMF file $\mathtt{athena\_xifu\_rmf\_v20160401.rmf}$. This generated an event FITS file, which was then converted into a PHA file using $\mathtt{makespec}$. We produced a fit to this spectrum in $\mathtt{XSPEC}$, using the Levenberg-Marquardt fitting method to calculate the reduced $\chi^2$. Figure~\ref{spectrum} shows one simulation for",Error processing this chunk
7,"${g_{a \gamma \gamma} = 3 \times 10^{-13} {\rm GeV}^{-1}}$ and its fit to an absorbed power law.\n\n\n\nWe use the following procedure to determine whether a particular value of $g_{a \gamma \gamma}$ is excluded: we varied the ALP-photon coupling $g_{a \gamma \gamma}$ from $g_{a \gamma \gamma} = 5 \times 10^{-13} \, \text{GeV}^{-1}$ to $g_{a \gamma \gamma} = 1\times 10^{-13} \, \text{GeV}^{-1}$, with stepsize $0.5 \times 10^{-13} \, \text{GeV}^{-1}$. As the bound is dependent on uncertainties in the magnetic field strength of a factor of 2, and we are only using simulated data, we do not consider step sizes smaller than this. For each $g_{a \gamma \gamma}$:\n\begin{enumerate}\n\item Generate 50 configurations of the magnetic field $B_i$.\n\item Use the $B_i$ to calculate the survival probability $P_{\gamma \rightarrow \gamma}$ along the line of sight for different photon energies (as done in \cite{1312.3947}). We calculate for 8000 equally spaced photon energies in the range 0.01--10~keV.\n\item Combine each $P_{\gamma \rightarrow \gamma}$ with the AGN spectrum.\n\item Generate 10 fake PHAs for each spectrum, providing 500 fake data samples in total.\n\item Fit the fake data to Model 0, and calculate the reduced chi-squareds $\chi_1^2$.\n\item Generate 100 fake PHAs based on Model 0, and compute the average of their reduced chi-squareds $\chi_0^2$.\nAssuming the absence of ALPs, this represents the expected quality of the fit to the single real data set. If the actual data is a poor fit\nfor some reason, then this will weaken the level of the resulting bounds that we can produce.\n\item Determine the percentage of fake data sets that have a reduced chi-squared $\chi_1^2 < \rm{max}(\langle \chi_0^2 \rangle,1)$. If this is true for fewer than 5 per cent of the data sets, the value of $g_{a \gamma \gamma}$ is excluded at 95 per cent confidence.\n\end{enumerate}\n\nFor a simulation of 200~ks of data with the nominal mirror configuration, we derive a projected\nbound of ${g_{a\gamma\gamma} \lesssim 1.5 \times 10^{-13}~ \rm{GeV}^{-1}}$ at 95 per cent confidence and of ${g_{a\gamma\gamma} \lesssim 2.5 \times 10^{-13}~ \rm{GeV}^{-1}}$ at 99\% confidence, as shown in Fig.~\ref{fig:ExclusionLimit} alongside published data limits. This represents an order of magnitude improvement over the bound derived from the 200~ks of Chandra ACIS-I observations in \cite{Berg:2016ese}. We also find that even\na short 10~ks observation will lead to an improved bound of ${g_{a\gamma\gamma} \lesssim 4.5 \times 10^{-13}~ \rm{GeV}^{-1}}$.\n\nThese bounds are substantially better than any current experimental or astrophysical bound, and also go beyond the capabilities of IAXO for ultralight ALP masses. The proposed DM haloscope ABRACADABRA has the potential to explore $g_{a \gamma \gamma}$ down to $10^{-17} \text{GeV}^{-1}$ for $m_a \in [10^{-14},10^{-6}] \text{eV}$ \cite{Kahn:2016aff}, if ALPs constitute the Dark Matter. The existence of ALP-induced oscillations in galaxy clusters is independent of this. Proposed CMB experiments such as PIXIE \cite{Kogut:2011xw} and PRISM \cite{Andre:2013afa} could produce a constraint",Error processing this chunk
8,"$g_{a \gamma \gamma} B < 10^{-16} \text{GeV}^{-1} \text{nG}$ which might be competitive with bounds from galaxy clusters if the cosmic magnetic field is close enough to saturation $\sim \text{nG}$ \cite{Tashiro:2013yea}. Black hole superradiance also offers tentative constraints ALPs on in the mass range $m_a \in [10^{-14},10^{-10}] \text{eV}$, depending on measurements of black hole spin \cite{Arvanitaki:2016qwi}. \n\n\n",Error processing this chunk
9,"\n\label{conclusion}\nAGNs situated in galaxy clusters are excellent targets to search for ALP-photon interconversion. {\it Athena}'s groundbreaking new technology will be able to resolve AGN spectra very precisely. The bound ${g_{a\gamma\gamma} \lesssim 1.5 \times 10^{-13}~ \rm{GeV}^{-1}}$ derived from simulations of 200~ks observations is an order of magnitude improvement over the bounds from current generation satellites. For the mass range ${m_a \lesssim 10^{-12}~\rm{eV}}$, it will also be far better than the bounds obtainable from future experimental searches such as IAXO.\n\n\nWe stress that this is only a first estimate of the sensitivity of {\it Athena} to ALP-induced modulations. The final sensitivity will depend on the capabilities of the finished satellite, the brightness of the AGN in 2028 and the quality of the actual data.\nTelescopes such as the Square Kilometre Array (SKA) are likely to reduce the uncertainties in the magnetic field model \cite{Braun:2015zta}, allowing for greater precision in $g_{a \gamma \gamma}$ bounds calculations by the time {\it Athena} launches. However, we have demonstrated that {\it Athena} will certainly improve bounds on $g_{a \gamma \gamma}$ substantively, and that X-ray astronomy will continue to be at the forefront of ultralight ALP searches in the coming decades.\n\n\n\section*{Acknowledgements}\n\nThis project is funded in part by the European Research Council starting grant `Supersymmetry Breaking in String Theory' (307605). Both Francesca Day and Nicholas Jennings are also funded by STFC.\\\n\bsp\n\bibliographystyle{mnras}\n\bibliography{Athenabib}\n\n\label{lastpage}\n\end{document}\n\n\documentclass[a4paper,11pt]{article}\n\n\n\usepackage[a4paper,\n left=2.5cm, right=2.5cm,\n top= 3cm, bottom=4cm]{geometry}\n\usepackage{amsmath}\n\usepackage{oldgerm}\n\usepackage{amssymb}\n\usepackage{bbm}\n\usepackage[dvips]{graphicx}\n\usepackage{epsfig}\n\usepackage{color} \n\usepackage{cite}\n\usepackage{epic}\n\usepackage{hyperref}\n\n\n%\setlength{\parindent}{0pt}\n\n\usepackage{empheq}\n\n\newcommand*\widefbox[1]{\fbox{\hspace{2em}#1\hspace{2em}}}\n\n\n%\usepackage{amsmath}\n\n\numberwithin{equation}{section}\n\n\usepackage[utf8]{inputenc}\n\n\usepackage{graphicx}\n\usepackage{mathrsfs}\n\usepackage{amsmath}\n\usepackage{amssymb}\n\usepackage{braket} \n\usepackage{hyperref}\n\usepackage{frontespizio}\n\usepackage{comment}\n\usepackage{epsfig}\n\usepackage{float}\n\usepackage{color}\n\usepackage[title]{appendix}\n\usepackage{multirow}\n%\usepackage{slashbox}\n\usepackage{tikz}\n\usetikzlibrary{decorations.pathmorphing}\n\usepackage{varwidth}\n\usepackage{tikz}\n\usetikzlibrary{backgrounds,patterns,calc}\n\usepackage{xparse}\n%\usepackage{subfigure}\n\usepackage{caption}\n\captionsetup{belowskip=-20pt}\n%\usepackage{showlabels}\n\n\usepackage{enumitem}\n\setlist[itemize]{leftmargin=*}\n\n\usetikzlibrary{decorations.pathmorphing}\n\n\tikzset{zigzag/.style={decorate, decoration=zigzag}}\n\def \L {2.}\n\n\newcommand{\cite}{\cite}\n\n\newcommand{\begin{eqnarray}}{\begin{eqnarray}}\n\newcommand{\end{eqnarray}}{\end{eqnarray}}\n\newcommand{",Error processing this chunk


### Upload file

In [139]:
#name_file = "1903.06239/Review.tex" # Palti's review
#name_file = "2008.10625/ls.tex" # Hebecker's review
#name_file = "2303.04819/Sections/Introduction.tex" # StringCosmo review. The sections are: Introduction, CosmoOverview, Moduli, Inflation, Postinflation, DarkEnergy, Alternatives, Outlook
#name_file = "2310.20559/ls.tex" # McAllister-Quevedo's review
name_file = "0701050/review.tex" # Denef-Douglas-Kachru's review

latex_file_path = 'Files/' + name_file

# Extract the LaTeX content
latex_content = extract_latex_content(latex_file_path, "\\startdocument", "\\enddocument")

len(latex_content)

76800

### Simplify the latex text using common replacements

In [140]:
replacements = {
        r'\\d': 'd',
        r'\\G': 'G',
        r'\\O': 'O',
        r'\\C': 'C',
        r'\\V': 'V',
        r'\\L': 'L',
        r'\\R': 'R',
        r'\\S': 'S',
        r'\\Mp': 'Mp',
        r'\\cN': 'N',
        r'\\cC': 'C',
        r'\\cP': 'P',
        r'\\cR': 'R',
        r'\\vo': 'V',
        r'\\Kahler': 'Kahler',
        r'\\flux': 'flux',
        r'\\KK': 'Kaluza-Klein',
        r'\\n': ' '
    }                                        # This can be improved adding more replacements

brace_commands = [r'\\emph', r'\\footnote', r'\\it', r'\\em', r'\\ref', r'\\eqref']               # This can be improved adding more replacements

simplified_text = replace_latex_commands(latex_content, replacements, brace_commands)
len(simplified_text)

76552

### Polish latex text removing standard latex commands

In [141]:
polished_text = clean_latex_content(simplified_text)         # This can be improved adding more commands
len(polished_text)

75561

### Split the text in chunks

In [143]:
no_char_in_chunk = 2000

chunks = chunk_text(polished_text, no_char_in_chunk)
chunks = [chunk.replace("%", "") for chunk in chunks]
print("The number of chunks is: " + str(len(chunks)) + ".")
chunks[23:25]

The number of chunks is: 45.


["The number of vacua $\\phi_*$ in an interval $I$ is given by \\begin{equation}\n\\label{ansatz}\nds^2 = g_{\\mu u} dx^{\\mu}dx^{ u} + R^2 \\tilde g_{mn}dy^m dy^n\n\\end{equation}6 where $\\theta(x):=1$ if $x>0$, $\\theta(x):=0$ if $x<0$. The integrand $delta(V') |V''|$ gives a contribution $+1$ for each critical point in $I$, while $\\theta(V'')$ restricts to actual minima. Now in the large $L$ limit, we can approximate the sum over $(N,M)$ by an integral, and write \\begin{equation}\n\\label{ansatz}\nds^2 = g_{\\mu u} dx^{\\mu}dx^{ u} + R^2 \\tilde g_{mn}dy^m dy^n\n\\end{equation}7 where $\\rho(\\phi)$ can be interpreted as a vacuum number density on moduli space. To evaluate the integral over $(N,M)$ at a given fixed $\\phi$, it is convenient to make the following linear change of variables $(N,M) \\to (v',v'')$: \\begin{equation}\n\\label{ansatz}\nds^2 = g_{\\mu u} dx^{\\mu}dx^{ u} + R^2 \\tilde g_{mn}dy^m dy^n\n\\end{equation}8 This change of variables has Jacobian $=1$, and the 

### Define the prompt to create the Q&A using the text from the papers

In [144]:
# Define the number of Q&A pairs you want to generate for each chunk
num_questions = 3

In [145]:
system_prompt_template = "You are an expert in theoretical physics. I will provide a text, and I'd like you to generate {num_questions} questions a researcher-level colleague might ask about the topic of the text. Then, provide detailed answers to these questions as an expeert in the field. Format your responses as follows: 'Question 1: [question here] Answer 1: [answer here]' and so on for all {num_questions} questions."

user_prompt_template = "Based on the following text, please generate the questions and answers as instructed. Text: {chunk}"

display(system_prompt_template)
display(user_prompt_template)


"You are an expert in theoretical physics. I will provide a text, and I'd like you to generate {num_questions} questions a researcher-level colleague might ask about the topic of the text. Then, provide detailed answers to these questions as an expeert in the field. Format your responses as follows: 'Question 1: [question here] Answer 1: [answer here]' and so on for all {num_questions} questions."

'Based on the following text, please generate the questions and answers as instructed. Text: {chunk}'

### Generate the Q&A using chat-gpt 3.5 turbo

In [146]:
client = OpenAI()

# Initialize a list to store chunk and response pairs
chunk_responses = []

# Assume chunks_test is a list of text chunks you want to generate Q&A for
for chunk in chunks:
    system_prompt, user_prompt = generate_prompt(chunk, num_questions, system_prompt_template, user_prompt_template)
    
    # Call the OpenAI API once per chunk
    response = client.chat.completions.create(
        model="gpt-3.5-turbo-0125",
        messages=[system_prompt, user_prompt]
    )
    
    # Append both the chunk and its response to the chunk_responses list
    chunk_responses.append({
        "chunk": chunk,
        "response": response.choices[-1].message.content if response.choices else "No response"
    })


In [147]:
# Initialize lists to hold the DataFrame data
chunk_list = []
question_list = []
answer_list = []
sub_index = []

# Process each chunk-response pair
for item in chunk_responses:
    chunk = item['chunk']
    response = item['response']
    
    # Split the response into Q&As
    qas = response.split('\n\n')  # Assuming two newlines separate each Q&A pair
    for i, qa in enumerate(qas):
        # Attempt to split the QA into question and answer
        parts = qa.split('\nAnswer ')
        if len(parts) == 2:
            question = parts[0].replace('Question {}: '.format(i+1), '').strip()
            answer = parts[1].strip()
            chunk_list.append(chunk)
            question_list.append(question)
            answer_list.append(answer)
            sub_index.append(i+1)

In [160]:
# Create a MultiIndex from the chunks and their corresponding sub_index
multi_index = pd.MultiIndex.from_arrays([chunk_list, sub_index], names=['Chunk', 'Q&A Index'])
answer_list = [re.sub(r'^\d+: ', '', answer) for answer in answer_list]

# Construct the DataFrame
df_multi = pd.DataFrame({'Question': question_list, 'Answer': answer_list}, index=multi_index)

# Display the DataFrame
#df_multi

### Visualize the Q&A ina  dataframe

In [149]:
qa_df = pd.DataFrame({
    'Question': question_list,
    'Answer': answer_list
})

qa_df = qa_df
qa_df

Unnamed: 0,Question,Answer
0,How did the second superstring revolution of 1994-97 address the doubts surrounding string theory being defined only as a perturbative expansion and the need for non-perturbative physics in constructing a completely realistic model?,"The second superstring revolution of 1994-97 addressed these doubts by convincingly arguing that all the different string theories and eleven-dimensional supergravity are actually limits or aspects of a unified framework called string/M theory. The central idea of duality emerged, demonstrating that the strong coupling limit of one string theory can be equivalent to another weakly coupled theory, leading to a more unified understanding of the subject."
1,"What were some of the key discoveries that led particle physicists to consider superstring theory as a viable contender for a ""theory of everything""?","Some key discoveries that propelled superstring theory's candidacy for a ""theory of everything"" included the development of supersymmetric versions of the theory, arguments for perturbative finiteness, discoveries of anomaly cancellations, and quasi-realistic compactifications of the heterotic string. These advancements collectively contributed to a broad consensus among physicists that superstring theory could potentially describe all of fundamental physics."
2,How did the concept of duality play a significant role in the development and acceptance of string/M theory as a unified framework encompassing various string theories and eleven-dimensional supergravity?,"The concept of duality was crucial in the evolution of string theory towards the unified framework of string/M theory. Duality showed that seemingly distinct string theories were actually different descriptions of the same underlying physics. For example, it revealed that the strongly coupled regime of one theory could be equivalent to the weakly coupled regime of another theory. This unification through duality helped reconcile the different versions of string theory and eleven-dimensional supergravity into a singular comprehensive framework, string/M theory, contributing to a deeper understanding of the subject."
3,What is the central idea of duality in the context of string/M theory as mentioned in the text?,"The central idea of duality in string/M theory refers to the concept that the strong coupling limit of one string theory can be equivalent to another theory that is weakly coupled, including M theory. This concept reveals that seemingly distinct theories are actually different limits or aspects of one unified framework."
4,"How did the ""second superstring revolution"" from 1994-97 contribute to theoretical physics as mentioned in the text?","The ""second superstring revolution"" during 1994-97 played a crucial role in theoretical physics by providing nonperturbative definitions for string/M theory and offering exact solutions for the effective Lagrangians of various supersymmetric field theories. It introduced the idea of duality, which established connections between different string theories and led to a unified framework known as string/M theory."
...,...,...
94,How does the text relate the search for inflationary measures in theoretical physics to analogous problems in particle physics?,"The text draws an analogy between the search for inflationary measures in theoretical physics and the hypothetical scenario of developing particle physics based on data at energies far below the natural scales of the Standard Model, suggesting that advances using precision information and very powerful supercomputers could potentially lead to inferences about the validity of certain theories even at energy scales well beyond what is experimentally accessible."
95,"In the context of the text, what role do asymptotically free gauge theories coupled to gravity play in advancing theoretical physics and potentially leading to the Standard Model?","The text suggests that asymptotically free gauge theories coupled to gravity are identified as sensible candidates for explaining certain aspects of theoretical physics, with the hypothetical scenario indicating that with enough theoretical advances and computational power, it may be possible to develop models resembling the Standard Model, at least for the first generation of matter, by reproducing experimental observations such as the table of isotopes and radioactivity."
96,"What challenges are encountered when considering different field theories that might lead to similar low energy physics, and how can researchers navigate through this uncertainty?","The challenges include the difficulty of predicting how many other field theories could result in similar low energy physics, leading to a period of great uncertainty where multiple competing ideas seem valid. Researchers must navigate through this uncertainty by primarily focusing on theoretical consistency and the elegance of the proposed framework."
97,"What experimental approaches could be used to test proposals arising from field theories, particularly those related to subtle corrections and higher-energy phenomena in astrophysics?","Experimental testing of proposals from field theories could involve making precise measurements of observables like atomic masses, spectra, and radioactive decay rates to detect subtle corrections compared to Standard Model predictions. Additionally, looking for high-energy data in astrophysical phenomena, such as cosmic ray events, could provide crucial insights into the validity of these proposals."


### Save the dataframe in a csv and parquet format

In [152]:
qa_df.to_csv("Datasets/0701050.csv")
qa_df.to_parquet("Datasets/0701050.parquet")

### Upload csv datasets for further processing

In [153]:
df_test = pd.read_csv("Datasets/0701050.csv", index_col=0)
df_test

Unnamed: 0,Question,Answer
0,How did the second superstring revolution of 1994-97 address the doubts surrounding string theory being defined only as a perturbative expansion and the need for non-perturbative physics in constructing a completely realistic model?,"The second superstring revolution of 1994-97 addressed these doubts by convincingly arguing that all the different string theories and eleven-dimensional supergravity are actually limits or aspects of a unified framework called string/M theory. The central idea of duality emerged, demonstrating that the strong coupling limit of one string theory can be equivalent to another weakly coupled theory, leading to a more unified understanding of the subject."
1,"What were some of the key discoveries that led particle physicists to consider superstring theory as a viable contender for a ""theory of everything""?","Some key discoveries that propelled superstring theory's candidacy for a ""theory of everything"" included the development of supersymmetric versions of the theory, arguments for perturbative finiteness, discoveries of anomaly cancellations, and quasi-realistic compactifications of the heterotic string. These advancements collectively contributed to a broad consensus among physicists that superstring theory could potentially describe all of fundamental physics."
2,How did the concept of duality play a significant role in the development and acceptance of string/M theory as a unified framework encompassing various string theories and eleven-dimensional supergravity?,"The concept of duality was crucial in the evolution of string theory towards the unified framework of string/M theory. Duality showed that seemingly distinct string theories were actually different descriptions of the same underlying physics. For example, it revealed that the strongly coupled regime of one theory could be equivalent to the weakly coupled regime of another theory. This unification through duality helped reconcile the different versions of string theory and eleven-dimensional supergravity into a singular comprehensive framework, string/M theory, contributing to a deeper understanding of the subject."
3,What is the central idea of duality in the context of string/M theory as mentioned in the text?,"The central idea of duality in string/M theory refers to the concept that the strong coupling limit of one string theory can be equivalent to another theory that is weakly coupled, including M theory. This concept reveals that seemingly distinct theories are actually different limits or aspects of one unified framework."
4,"How did the ""second superstring revolution"" from 1994-97 contribute to theoretical physics as mentioned in the text?","The ""second superstring revolution"" during 1994-97 played a crucial role in theoretical physics by providing nonperturbative definitions for string/M theory and offering exact solutions for the effective Lagrangians of various supersymmetric field theories. It introduced the idea of duality, which established connections between different string theories and led to a unified framework known as string/M theory."
...,...,...
94,How does the text relate the search for inflationary measures in theoretical physics to analogous problems in particle physics?,"The text draws an analogy between the search for inflationary measures in theoretical physics and the hypothetical scenario of developing particle physics based on data at energies far below the natural scales of the Standard Model, suggesting that advances using precision information and very powerful supercomputers could potentially lead to inferences about the validity of certain theories even at energy scales well beyond what is experimentally accessible."
95,"In the context of the text, what role do asymptotically free gauge theories coupled to gravity play in advancing theoretical physics and potentially leading to the Standard Model?","The text suggests that asymptotically free gauge theories coupled to gravity are identified as sensible candidates for explaining certain aspects of theoretical physics, with the hypothetical scenario indicating that with enough theoretical advances and computational power, it may be possible to develop models resembling the Standard Model, at least for the first generation of matter, by reproducing experimental observations such as the table of isotopes and radioactivity."
96,"What challenges are encountered when considering different field theories that might lead to similar low energy physics, and how can researchers navigate through this uncertainty?","The challenges include the difficulty of predicting how many other field theories could result in similar low energy physics, leading to a period of great uncertainty where multiple competing ideas seem valid. Researchers must navigate through this uncertainty by primarily focusing on theoretical consistency and the elegance of the proposed framework."
97,"What experimental approaches could be used to test proposals arising from field theories, particularly those related to subtle corrections and higher-energy phenomena in astrophysics?","Experimental testing of proposals from field theories could involve making precise measurements of observables like atomic masses, spectra, and radioactive decay rates to detect subtle corrections compared to Standard Model predictions. Additionally, looking for high-energy data in astrophysical phenomena, such as cosmic ray events, could provide crucial insights into the validity of these proposals."


### Concatenate all datasets from various papers to create a single dataset about string phenomenology (and save it)

In [161]:
from sklearn.utils import shuffle

directory_path = 'Datasets/'

# Initialize a list to hold the dataframes
dataframes = []

# Iterate through all files in the directory
for filename in os.listdir(directory_path):
    if filename.endswith('.csv'):
        # Load each CSV file into a DataFrame, excluding the index
        df_temp = pd.read_csv(os.path.join(directory_path, filename), index_col=0)
        # Append the DataFrame to the list
        dataframes.append(df_temp)

# Concatenate all the DataFrames into a single DataFrame
concatenated_df = pd.concat(dataframes, ignore_index=True)

# Shuffle the rows of the concatenated DataFrame
shuffled_df = shuffle(concatenated_df)

# Reset the index to get rid of the old indexing
shuffled_df.reset_index(drop=True, inplace=True)

shuffled_df

Unnamed: 0,Question,Answer
0,"Can dS vacua be obtained in the IIB setting, and what are the methods or approaches suggested to achieve this?","Yes, it is possible to obtain de Sitter (dS) vacua in the IIB setting by incorporating additional effects from the low energy effective action or by adopting a more generalized approach to seeking minima of the effective action. Various proposals have been put forward to construct dS vacua. These proposals can be found in recent research that summarizes the state of the art in dS constructions and highlights the challenges involved. Additional strategies include incorporating anti-branes, which were originally proposed as part of the KKLT construction."
1,"What role do the slow-roll conditions play in multi-field inflation, and how do they relate to the decomposition of the inflationary trajectory into tangent and normal directions?","In multi-field inflation, the slow-roll conditions are essential for ensuring the smooth evolution of the scalar fields and the inflationary dynamics. These conditions constrain the time derivatives of the scalar fields and their gradient with respect to the potential. By utilizing a kinematic basis, one can decompose the inflationary trajectory into adiabatic (tangent) and entropic (normal) directions, which simplifies the analysis and understanding of the inflationary dynamics."
2,"How does the distribution of flux values in the model impact the number of solutions, and how does the choice of parameters affect the range of possible solutions?","The distribution of flux values in the model plays a crucial role in determining the number of solutions. The regularity in the distribution of flux values affects the intervals in which the cosmological constant falls. By making the flux values sufficiently different, one can ensure a more realistic situation. The choice of parameters, such as the size of the flux couplings and the range of the cosmological constant, influences the diversity and quantity of solutions in the model."
3,How does the inclusion of Kaluza-Klein (KK) modes within the $R^d$-dimensional theory relate to the universal quantum gravity bound and the effective theory's scale?,"Including the KK modes within the $R^d$-dimensional theory allows for a quantitative analysis of how many modes can be accommodated before reaching the universal quantum gravity bound, which is the $R^d$-dimensional Planck mass. This counting of KK modes provides insights into the effective description of higher-dimensional theories and helps ascertain the consistency and limitations of the effective field theory approach within the framework of string theory."
4,What are some of the key criticisms or challenges faced by the swampland approach and the Planckian censorship conjecture in particular?,"Some criticisms and challenges faced by the swampland approach, including the Planckian censorship conjecture, involve the speculative nature of these concepts and the lack of a clear explanatory framework for certain restrictions they propose. Critics have raised questions about the relevance of constraints on EFTs imposed by such conjectures and the need for further empirical and theoretical justifications to validate their implications. Additionally, the swampland approach has been perceived as less motivated compared to other conjectures in the field, leading to debates about its significance and impact on advancing our understanding of quantum gravity and cosmology."
...,...,...
5197,What are bifurcated throats and how do they address backreaction effects in the model mentioned in the text?,"Bifurcated throats are a theoretical construct used in string theory and braneworld scenarios where the geometry of spacetime bifurcates into separate regions resembling 'throats'. These throats can be used to address backreaction effects by providing a way to localize different types of matter fields or interactions in distinct regions, thereby mitigating the impact of backreactions."
5198,"In the context of string inflationary scenarios, what distinguishes the classes of models focused on in the text from the broader set of string-inspired models present in the literature?","The classes of models focused on in the text represent the most developed string inflationary scenarios. These models have concrete proposals within the framework of string theory and have been studied extensively in terms of their theoretical implications and observational predictions. On the other hand, the broader set of string-inspired models in the literature includes proposals that are based on ideas from string theory but may lack a solid stringy embedding or detailed mechanisms for moduli stabilization. While these broader models contribute to the diversity of ideas in the field, they may not have the same level of theoretical development and predictive power as the more focused classes of string inflation models discussed in the text."
5199,What is the significance of the DBI inflation scenario and its non-canonical kinetic terms in the context of theoretical physics?,The DBI inflation scenario is significant in theoretical physics as it presents a framework beyond the slow-roll approximation for achieving accelerated expansion. Non-canonical kinetic terms arising from the DBI action introduce new dynamics that can lead to unique inflationary phenomenology and contribute to the understanding of early universe dynamics.
5200,"What is the significance of the equation of state of dark energy changing with time, and how does it relate to inflationary cosmology?","The changing equation of state of dark energy during quintessence is significant as it can lead to an accelerated expansion of the universe. This behavior is similar to inflationary cosmology, where the equation of state of the inflaton field drives a rapid expansion in the early universe. The evolving equation of state during quintessence can lead to different behaviors of the dark energy field over time, with potential implications for the ultimate fate of the universe."


In [159]:
shuffled_df.to_csv("Datasets/StringPhenoDataset.csv")
shuffled_df.to_parquet("Datasets/StringPhenoDataset.parquet")