In [1]:
import random
import json
from groq import Groq
from time import sleep
from tqdm import tqdm

In [2]:
path = 'data/queries.json'

In [3]:
import json

with open(path, 'r', encoding='utf-8') as f:
    data = f.readlines()
    data = [json.loads(line) for line in data]

In [4]:
data[:10]

[{'id': '2205.13172',
  'submitter': 'Sergei V. Ketov',
  'authors': 'Sergei V. Ketov',
  'title': 'Starobinsky-Bel-Robinson gravity',
  'comments': '7 pages, no figures, LaTeX; major revision',
  'journal-ref': 'Universe 2022, 8, 351',
  'doi': '10.3390/universe8070351',
  'report-no': 'IPMU22-0031',
  'categories': 'gr-qc astro-ph.CO hep-th',
  'license': 'http://creativecommons.org/licenses/by/4.0/',
  'abstract': '  A novel superstring-inspired gravitational theory in four spacetime\ndimensions is proposed as a sum of the modified $(R+\\alpha R^2)$ gravity\nmotivated by the Starobinsky inflation and the Bel-Robinson-tensor-squared term\nmotivated by the eleven-dimensional M-theory dimensionally reduced to four\ndimensions. The proposed Starobinsky-Bel-Robinson action has only two\nparameters, which makes it suitable for verifiable physical applications in\nblack hole physics, cosmological inflation and Hawking radiation in the early\nuniverse.\n',
  'versions': [{'version': 'v1', '

In [5]:
from AuthKey import GROQ_API_KEY

client = Groq(
    api_key=GROQ_API_KEY,
)

In [71]:
def evaluate_articles_boolean(artigos, 
                      query,
                      model = 'llama3-70b-8192',
                      max_tokens = 1000,
                      verbose = True):
    """
    artigos: list of dictionaries with the following keys: 'title', 'abstract'
    query: string with the query that the articles will be evaluated against

    Returns a list of dictionaries with the following keys: 'title', 'abstract', 'eval', where 'eval' is a boolean value where 1 means relevant and 0 means not relevant to the query    
    """

    evaluated = []
    if verbose: print("Query:", query)

    for artigo in tqdm(artigos, desc="Evaluating articles"):
        prompt = f"Read the following article, named '{artigo['title']}', with the following content: \n {artigo['abstract']} \n \
                Evaluate if the article is relevant to the following query, and don't be strict about your classification: {query} \n"

        while True:
            try:
                response = client.chat.completions.create(
                    model=model,
                    n=1,
                    messages=[
                        {"role": "user", "content": "You are an assistant AI specialized in evaluating articles based on a given query. \
                        Your goal is to evaluate an article's relevance based on a search query. You should return only the number 1 or 0, where 1 means true and 0 means false, \
                        based on whether the article is at least slightly relevant to a given query. If the article is related to the same field, it is enough for it to be considered relevant. For example: \n \
                        Read the following article, named 'Increased lifespan on athletes', with the following content: \n Sports practicing has been shown to increase lifespawn and health. \n\
                        Evaluate if the article is relevant to the following query: Positive health impacts on volleyball practice. \n \
                        Response: 1"},
                        {"role": "user", "content": prompt}
                    ],
                    max_tokens = max_tokens)
                if int(response.choices[0].message.content.lower()) in [0, 1]:
                    evaluated.append({'title': artigo['title'], 'abstract': artigo['abstract'], 'eval': response.choices[0].message.content.lower()})
                    if verbose: print(f"Article '{artigo['title']}' evaluated as {response.choices[0].message.content.lower()}")
                    break
                else:
                    print("Invalid response, trying again.")
            except Exception as e:
                print("Rate limit achieved:", e)
                sleep(30)
                continue
    return evaluated

In [46]:
query = data[99]['query']
query

'transformer-based models for optimizing ranked list truncation in information retrieval'

In [50]:
evaluated = evaluate_articles_boolean(data, query)

Query: transformer-based models for optimizing ranked list truncation in information retrieval


Evaluating articles:   1%|          | 1/100 [00:00<00:42,  2.35it/s]

Article 'Starobinsky-Bel-Robinson gravity' evaluated as 0


Evaluating articles:   2%|▏         | 2/100 [00:00<00:37,  2.59it/s]

Article 'Deep Convolutional Neural Networks Model-based Brain Tumor Detection in
  Brain MRI Images' evaluated as 0


Evaluating articles:   3%|▎         | 3/100 [00:01<00:43,  2.25it/s]

Article 'A Theory-Based Evaluation of Nearest Neighbor Models Put Into Practice' evaluated as 0


Evaluating articles:   4%|▍         | 4/100 [00:01<00:39,  2.44it/s]

Article 'Transfer and Share: Semi-Supervised Learning from Long-Tailed Data' evaluated as 0


Evaluating articles:   5%|▌         | 5/100 [00:05<02:26,  1.54s/it]

Article 'Biharmonic homogeneous polynomial maps between spheres' evaluated as 0


Evaluating articles:   6%|▌         | 6/100 [00:15<07:17,  4.66s/it]

Article 'Integration of Blockchain and Edge Computing in Internet of Things: A
  Survey' evaluated as 0


Evaluating articles:   7%|▋         | 7/100 [00:24<09:15,  5.97s/it]

Article 'Multi-fidelity power flow solver' evaluated as 0


Evaluating articles:   8%|▊         | 8/100 [00:34<11:04,  7.23s/it]

Article 'Automatic Detection of ECG Abnormalities by using an Ensemble of Deep
  Residual Networks with Attention' evaluated as 0


Evaluating articles:   9%|▉         | 9/100 [00:44<12:10,  8.03s/it]

Article 'Determination of the $N_f=12$ step scaling function using M\"obius
  domain wall fermions' evaluated as 0


Evaluating articles:  10%|█         | 10/100 [00:48<10:27,  6.97s/it]

Article 'DDet: Dual-path Dynamic Enhancement Network for Real-World Image
  Super-Resolution' evaluated as 0


Evaluating articles:  11%|█         | 11/100 [00:57<11:12,  7.56s/it]

Article 'Thermalizing two identical particles' evaluated as 0


Evaluating articles:  12%|█▏        | 12/100 [01:06<11:34,  7.90s/it]

Article 'Development of Transition-Edge Sensor X-ray Microcalorimeter Linear
  Array for Compton Scattering and Energy Dispersive Diffraction Imaging' evaluated as 0


Evaluating articles:  13%|█▎        | 13/100 [01:10<09:38,  6.65s/it]

Article 'Multiple representations of real numbers on self-similar sets with
  overlaps' evaluated as 0


Evaluating articles:  14%|█▍        | 14/100 [01:19<10:32,  7.35s/it]

Article 'Lying on networks: The role of structure and topology in promoting
  honesty' evaluated as 0


Evaluating articles:  15%|█▌        | 15/100 [01:23<09:14,  6.52s/it]

Article 'Elevated ionizing photon production efficiency in faint
  high-equivalent-width Lyman-alpha emitters' evaluated as 0


Evaluating articles:  16%|█▌        | 16/100 [01:33<10:27,  7.47s/it]

Article 'Don't shoot butterfly with rifles: Multi-channel Continuous Speech
  Separation with Early Exit Transformer' evaluated as 0


Evaluating articles:  17%|█▋        | 17/100 [01:39<09:35,  6.94s/it]

Article 'Unpredictable repeatability in molecular evolution' evaluated as 0


Evaluating articles:  18%|█▊        | 18/100 [01:47<10:11,  7.46s/it]

Article 'Simplex-averaged finite element methods for $H({\rm grad})$, $H({\rm
  curl})$ and $H({\rm div})$ convection-diffusion problems' evaluated as 0


Evaluating articles:  19%|█▉        | 19/100 [01:56<10:33,  7.82s/it]

Article 'Fourier transform detection of weak optical transitions with cyclic
  routines' evaluated as 0


Evaluating articles:  20%|██        | 20/100 [02:02<09:33,  7.17s/it]

Article 'sBSNN: Stochastic-Bits Enabled Binary Spiking Neural Network with
  On-Chip Learning for Energy Efficient Neuromorphic Computing at the Edge' evaluated as 0


Evaluating articles:  21%|██        | 21/100 [02:04<07:36,  5.78s/it]

Article 'Which Generation Shows the Most Prudent Data Sharing Behaviour?' evaluated as 0


Evaluating articles:  22%|██▏       | 22/100 [02:13<08:43,  6.71s/it]

Article 'A New Charter of Ethics and Rights of Artificial Consciousness in a
  Human World' evaluated as 0


Evaluating articles:  23%|██▎       | 23/100 [02:17<07:23,  5.76s/it]

Article 'X-ray measurement model incorporating energy-correlated material
  variability and its application in information-theoretic system analysis' evaluated as 0


Evaluating articles:  24%|██▍       | 24/100 [02:21<06:51,  5.41s/it]

Article 'Superconductor-metal quantum transition at the EuO-KTaO3 interface' evaluated as 0


Evaluating articles:  25%|██▌       | 25/100 [02:31<08:21,  6.69s/it]

Article 'Efficient Inverse-Free Incremental and Decremental Algorithms for
  Multiple Hidden Nodes in Extreme Learning Machine' evaluated as 0


Evaluating articles:  26%|██▌       | 26/100 [02:41<09:21,  7.59s/it]

Article 'Fingerprints of giant planets in the composition of solar twins' evaluated as 0


Evaluating articles:  27%|██▋       | 27/100 [02:51<10:21,  8.52s/it]

Article 'Few-Shot Adaptation of Generative Adversarial Networks' evaluated as 0


Evaluating articles:  28%|██▊       | 28/100 [03:00<10:16,  8.56s/it]

Article 'Lamina-specific neuronal properties promote robust, stable signal
  propagation in feedforward networks' evaluated as 0


Evaluating articles:  29%|██▉       | 29/100 [03:06<09:07,  7.71s/it]

Article 'BCFT entanglement entropy at large central charge and the black hole
  interior' evaluated as 0


Evaluating articles:  30%|███       | 30/100 [03:08<07:11,  6.16s/it]

Article 'Longitudinal tension and mechanical stability of a pressurized straw
  tube' evaluated as 0


Evaluating articles:  31%|███       | 31/100 [03:17<08:06,  7.05s/it]

Article 'MeshAdv: Adversarial Meshes for Visual Recognition' evaluated as 0


Evaluating articles:  32%|███▏      | 32/100 [03:23<07:33,  6.67s/it]

Article 'Automatic Segmentation, Feature Extraction and Comparison of Healthy and
  Stroke Cerebral Vasculature' evaluated as 0


Evaluating articles:  33%|███▎      | 33/100 [03:29<07:08,  6.39s/it]

Article 'How Phonotactics Affect Multilingual and Zero-shot ASR Performance' evaluated as 0


Evaluating articles:  34%|███▍      | 34/100 [03:32<05:48,  5.28s/it]

Article 'Constraining annihilating dark matter by radio continuum spectrum of the
  Large Magellanic Cloud' evaluated as 0


Evaluating articles:  35%|███▌      | 35/100 [03:37<05:51,  5.41s/it]

Article 'Contrastive Learning with Adversarial Examples' evaluated as 0


Evaluating articles:  36%|███▌      | 36/100 [03:45<06:30,  6.09s/it]

Article 'DeeBERT: Dynamic Early Exiting for Accelerating BERT Inference' evaluated as 1


Evaluating articles:  37%|███▋      | 37/100 [03:54<07:12,  6.87s/it]

Article 'Listening for Sirens: Locating and Classifying Acoustic Alarms in City
  Scenes' evaluated as 0


Evaluating articles:  38%|███▊      | 38/100 [04:04<08:18,  8.04s/it]

Article 'Transient chaotic dimensionality expansion by recurrent networks' evaluated as 0


Evaluating articles:  39%|███▉      | 39/100 [04:09<07:08,  7.02s/it]

Article 'Ergodic Achievable Rate Maximization of RIS-assisted Millimeter-Wave
  MIMO-OFDM Communication Systems' evaluated as 0
Rate limit achieved: invalid literal for int() with base 10: '0 \n\nthis article is not relevant to the query about transformer-based models for optimizing ranked list truncation in information retrieval. the article is focused on a deep learning guided fuzzing


Evaluating articles:  40%|████      | 40/100 [04:50<17:03, 17.05s/it]

Article 'DeFuzz: Deep Learning Guided Directed Fuzzing' evaluated as 0


Evaluating articles:  41%|████      | 41/100 [04:50<11:51, 12.05s/it]

Article 'Inherently stable effective field theory for dark energy and modified
  gravity' evaluated as 0


Evaluating articles:  42%|████▏     | 42/100 [04:50<08:15,  8.54s/it]

Article 'On complexity of representations of quivers' evaluated as 0


Evaluating articles:  43%|████▎     | 43/100 [04:51<05:46,  6.08s/it]

Article 'Quantum Formation of Primordial Black holes' evaluated as 0


Evaluating articles:  44%|████▍     | 44/100 [04:53<04:43,  5.07s/it]

Article 'Tree Reconstruction using Topology Optimisation' evaluated as 0


Evaluating articles:  45%|████▌     | 45/100 [04:59<04:43,  5.15s/it]

Article 'Deep Learning for Ultra-Reliable and Low-Latency Communications in 6G
  Networks' evaluated as 0


Evaluating articles:  46%|████▌     | 46/100 [05:03<04:29,  4.98s/it]

Article 'Active galactic nuclei ghosts: A systematic search for faded nuclei' evaluated as 0


Evaluating articles:  47%|████▋     | 47/100 [05:12<05:22,  6.08s/it]

Article 'Nonbinary Error-Detecting Hybrid Codes' evaluated as 0


Evaluating articles:  48%|████▊     | 48/100 [05:21<05:56,  6.86s/it]

Article 'Interactive Movement Primitives: Planning to Push Occluding Pieces for
  Fruit Picking' evaluated as 0


Evaluating articles:  49%|████▉     | 49/100 [05:30<06:33,  7.71s/it]

Article 'Pb-doped p-type Bi$_2$Se$_3$ thin films via interfacial engineering' evaluated as 0


Evaluating articles:  50%|█████     | 50/100 [05:34<05:22,  6.46s/it]

Article 'Growth of nonsymmetric operads' evaluated as 0


Evaluating articles:  51%|█████     | 51/100 [05:43<05:53,  7.21s/it]

Article 'Optimizing Electric Multiple Unit Circulation Plan within Maintenance
  Constraints for High-Speed Railway System' evaluated as 0


Evaluating articles:  52%|█████▏    | 52/100 [05:46<04:53,  6.12s/it]

Article 'Near-field imaging of surface-plasmon vortex-modes around a single
  elliptical nanohole in a gold film' evaluated as 0


Evaluating articles:  53%|█████▎    | 53/100 [05:55<05:30,  7.02s/it]

Article 'Driven translocation of a semiflexible polymer through a conical channel
  in the presence of attractive surface interactions' evaluated as 0


Evaluating articles:  54%|█████▍    | 54/100 [06:03<05:31,  7.21s/it]

Article 'The Accuracy of Restricted Boltzmann Machine Models of Ising Systems' evaluated as 0


Evaluating articles:  55%|█████▌    | 55/100 [06:11<05:33,  7.40s/it]

Article 'See saw mechanism with Yukawa alignment for neutrinos' evaluated as 0


Evaluating articles:  56%|█████▌    | 56/100 [06:14<04:27,  6.09s/it]

Article 'Game Values of Strong Placement Games' evaluated as 0


Evaluating articles:  57%|█████▋    | 57/100 [06:20<04:16,  5.97s/it]

Article 'On the centralizer of vector fields: criteria of triviality and
  genericity results' evaluated as 0


Evaluating articles:  58%|█████▊    | 58/100 [06:25<04:07,  5.88s/it]

Article 'Attacks Which Do Not Kill Training Make Adversarial Learning Stronger' evaluated as 0


Evaluating articles:  59%|█████▉    | 59/100 [06:30<03:45,  5.51s/it]

Article 'SymNMF-Net for The Symmetric NMF Problem' evaluated as 0


Evaluating articles:  60%|██████    | 60/100 [06:39<04:18,  6.45s/it]

Article 'Vibrational Heat-Bath Configuration Interaction' evaluated as 0


Evaluating articles:  61%|██████    | 61/100 [06:42<03:39,  5.62s/it]

Article 'A unified view of space-time covariance functions through Gelfand pairs' evaluated as 0


Evaluating articles:  62%|██████▏   | 62/100 [06:52<04:20,  6.84s/it]

Article 'Grasping as Inference: Reactive Grasping in Heavily Cluttered
  Environment' evaluated as 0


Evaluating articles:  63%|██████▎   | 63/100 [06:57<03:49,  6.21s/it]

Article 'The Case for Learning Application Behavior to Improve Hardware Energy
  Efficiency' evaluated as 0


Evaluating articles:  64%|██████▍   | 64/100 [07:02<03:37,  6.05s/it]

Article 'Cost-Optimal Laser-Accelerated Lightsails' evaluated as 0


Evaluating articles:  65%|██████▌   | 65/100 [07:07<03:17,  5.66s/it]

Article 'Nonreciprocal directional dichroism induced by a temperature gradient as
  a probe for mobile spin dynamics in quantum magnets' evaluated as 0


Evaluating articles:  66%|██████▌   | 66/100 [07:12<03:01,  5.34s/it]

Article 'A broadband achromatic polarization-insensitive metalens consisting of
  anisotropic nanostructures' evaluated as 0


Evaluating articles:  67%|██████▋   | 67/100 [07:19<03:20,  6.07s/it]

Article 'Asymptotic Expansions of The Traces of the Thermoelastic Operators' evaluated as 0


Evaluating articles:  68%|██████▊   | 68/100 [07:25<03:10,  5.95s/it]

Article 'On Eventually Periodic Sets as Minimal Additive Complements' evaluated as 0


Evaluating articles:  69%|██████▉   | 69/100 [07:29<02:42,  5.23s/it]

Article 'Two-phonon structures for beta-decay theory' evaluated as 0


Evaluating articles:  70%|███████   | 70/100 [07:37<03:07,  6.26s/it]

Article 'Symbiotic Child Emotional Support with Social Robots and Temporal
  Knowledge Graphs' evaluated as 0


Evaluating articles:  71%|███████   | 71/100 [07:42<02:47,  5.77s/it]

Article 'High Tc superconductivity in heavy Rare Earth Hydrides: correlation
  between the presence of the f states on the Fermi surface, nesting and the
  value of Tc' evaluated as 0


Evaluating articles:  72%|███████▏  | 72/100 [07:54<03:31,  7.56s/it]

Article 'Diffusion in the presence of correlated dynamical disorder and coherent
  exciton transfer in the non-Markovian limit' evaluated as 0


Evaluating articles:  73%|███████▎  | 73/100 [07:58<03:00,  6.70s/it]

Article 'Continuous-time multi-state capture-recapture models' evaluated as 0


Evaluating articles:  74%|███████▍  | 74/100 [08:08<03:17,  7.59s/it]

Article 'A panoramic landscape of the Sagittarius stream in Gaia DR2 revealed
  with the STREAMFINDER spyglass' evaluated as 0


Evaluating articles:  75%|███████▌  | 75/100 [08:12<02:40,  6.41s/it]

Article 'Application of the iterative reconstruction to simulated galaxy fields' evaluated as 0


Evaluating articles:  76%|███████▌  | 76/100 [08:19<02:36,  6.51s/it]

Article 'Model Watermarking for Image Processing Networks' evaluated as 0


Evaluating articles:  77%|███████▋  | 77/100 [08:28<02:53,  7.55s/it]

Article 'Numerical approximation of elliptic problems with log-normal random
  coefficients' evaluated as 0


Evaluating articles:  78%|███████▊  | 78/100 [08:33<02:26,  6.66s/it]

Article 'A search for cosmological anisotropy using the Lyman alpha forest from
  SDSS quasar spectra' evaluated as 0


Evaluating articles:  79%|███████▉  | 79/100 [08:38<02:06,  6.04s/it]

Article 'An Inertial Block Majorization Minimization Framework for Nonsmooth
  Nonconvex Optimization' evaluated as 0


Evaluating articles:  80%|████████  | 80/100 [08:41<01:44,  5.22s/it]

Article 'Big Quantum cohomology of orbifold spheres' evaluated as 0


Evaluating articles:  81%|████████  | 81/100 [08:45<01:32,  4.88s/it]

Article 'Synchrotron radiation from a charge circulating around a cylinder with
  negative permittivity' evaluated as 0


Evaluating articles:  82%|████████▏ | 82/100 [08:50<01:26,  4.83s/it]

Article 'Novel Cascaded Gaussian Mixture Model-Deep Neural Network Classifier for
  Speaker Identification in Emotional Talking Environments' evaluated as 0


Evaluating articles:  83%|████████▎ | 83/100 [08:58<01:38,  5.82s/it]

Article 'A Note About the {Ki(z)} Functions' evaluated as 0


Evaluating articles:  84%|████████▍ | 84/100 [09:01<01:22,  5.14s/it]

Article 'Understanding Metrics for Paraphrasing' evaluated as 0


Evaluating articles:  85%|████████▌ | 85/100 [09:06<01:12,  4.83s/it]

Article 'Single Crystal Growth of Cuprate Superconductor
  (Lu$_{0.8}$Nd$_{0.2}$)Ba$_2$Cu$_4$O$_8$ by KOH Flux Method' evaluated as 0


Evaluating articles:  86%|████████▌ | 86/100 [09:11<01:11,  5.08s/it]

Article 'Nonlinear Stochastic Trajectory Optimization for Centroidal Momentum
  Motion Generation of Legged Robots' evaluated as 0


Evaluating articles:  87%|████████▋ | 87/100 [09:15<01:00,  4.63s/it]

Article 'Leveraging Causal Inference for Explainable Automatic Program Repair' evaluated as 0


Evaluating articles:  88%|████████▊ | 88/100 [09:19<00:55,  4.62s/it]

Article 'Temporal Attention-Augmented Graph Convolutional Network for Efficient
  Skeleton-Based Human Action Recognition' evaluated as 0


Evaluating articles:  89%|████████▉ | 89/100 [09:24<00:50,  4.60s/it]

Article 'Control Design of Autonomous Drone Using Deep Learning Based Image
  Understanding Techniques' evaluated as 0


Evaluating articles:  90%|█████████ | 90/100 [09:27<00:39,  3.99s/it]

Article 'Rigidity for rigid analytic motives' evaluated as 0


Evaluating articles:  91%|█████████ | 91/100 [09:34<00:45,  5.09s/it]

Article 'Sizing the White Whale' evaluated as 0


Evaluating articles:  92%|█████████▏| 92/100 [09:42<00:48,  6.01s/it]

Article 'Regularized maximal fidelity of the generalized Pauli channels' evaluated as 0


Evaluating articles:  93%|█████████▎| 93/100 [09:49<00:43,  6.21s/it]

Article 'Fighting Contextual Bandits with Stochastic Smoothing' evaluated as 0


Evaluating articles:  94%|█████████▍| 94/100 [09:54<00:34,  5.79s/it]

Article 'Acute Lymphoblastic Leukemia Detection Using Hypercomplex-Valued
  Convolutional Neural Networks' evaluated as 0


Evaluating articles:  95%|█████████▌| 95/100 [10:02<00:32,  6.41s/it]

Article 'The profinite completion of relatively hyperbolic virtually special
  groups' evaluated as 0


Evaluating articles:  96%|█████████▌| 96/100 [10:11<00:28,  7.18s/it]

Article 'On-Shell Electric-Magnetic Duality and the Dual Graviton' evaluated as 0


Evaluating articles:  97%|█████████▋| 97/100 [10:18<00:21,  7.32s/it]

Article 'A stationary heat conduction problem' evaluated as 0


Evaluating articles:  98%|█████████▊| 98/100 [10:23<00:12,  6.49s/it]

Article 'Small-mass naked singularities censored by the Higgs field' evaluated as 0


Evaluating articles:  99%|█████████▉| 99/100 [10:29<00:06,  6.25s/it]

Article 'Thermal Instability of Halo Gas Heated by Streaming Cosmic Rays' evaluated as 0


Evaluating articles: 100%|██████████| 100/100 [10:33<00:00,  6.34s/it]

Article 'Choppy: Cut Transformer For Ranked List Truncation' evaluated as 1





In [54]:
import pandas as pd
evaluated_df = pd.DataFrame(evaluated)

In [55]:
evaluated_df[evaluated_df['eval'] == '1']

Unnamed: 0,title,abstract,eval
35,DeeBERT: Dynamic Early Exiting for Acceleratin...,Large-scale pre-trained language models such...,1
99,Choppy: Cut Transformer For Ranked List Trunca...,Work in information retrieval has traditiona...,1


In [77]:
import json

In [107]:
def get_initial_response(prompt, model = 'llama3-70b-8192', max_tokens = 1000):
    while True:
        try:
            response = client.chat.completions.create(
                model=model,
                n=1,
                messages=[
                    {"role": "user", "content": "You are an assistant AI specialized in evaluating articles based on a given query. \
                    Your goal is to evaluate an article's relevance based on a search query. You should return only one of the following integers: 0, 1, 2, or 3. \
                    0 means that the article has absolutely no relevance for the query. \
                    1 means that the article is only very slightly relevant to the query, sharing at most a similar topic. \
                    2 means that the article is relevant to the query, sharing many similarities, but it's still not entirely relevant to the query. \
                    3 means that the article is completely relevant to the query. \
                    For example: \n \
                    Read the following article, named 'Increased lifespan on athletes', with the following content: \n Sports practicing has been shown to increase lifespawn and health. \n\
                    Evaluate how relevant the article is to the following query: Positive health impacts on volleyball practice. \n \
                    Response: 2"},
                    {"role": "user", "content": prompt}
                ],
                max_tokens = max_tokens)
            return response.choices[0].message.content.lower()
        except Exception as e:
            print("Error when generating initial response:", e)
            sleep(30)
            continue

In [111]:
def get_feedback(artigo, query, response, model = 'llama3-70b-8192', max_tokens = 1000):
    while True:
        try:
            feedback = client.chat.completions.create(
                model=model,
                n=1,
                messages=[
                    {"role": "user", "content": f"You are an assistant AI specialized in reevaluating articles based on a given query. \
                    Your goal is to reevaluate the classification given by the previous assistant, about an article's relevance based on a search query. The relevance levels are: \
                    0 means that the article has absolutely no relevance for the query. \
                    1 means that the article is only very slightly relevant to the query, sharing at most a similar topic. \
                    2 means that the article is relevant to the query, sharing many similarities, but it's still not entirely relevant to the query. \
                    3 means that the article is completely relevant to the query. \
                    The article, titled '{artigo['title']}', has the following content: \n {artigo['abstract']} \n \
                    The query is: {query} \n \
                    The previous evaluation is: {response} \n \
                    Do you agree with the previous evaluation? \
                    Try to avoid extreme answers like 0 or 3 unless you are sure that is the case. \
                    Write your answer in the following json structure, where 'explanation' represents your reasoning, and 'eval' represents your evaluation: \n \
                    {{\"explanation\": \"your explanation\", \"eval\": \"your evaluation, needs to be exactly 0, 1, 2, or 3.\"\}}"}
                ],
                max_tokens = max_tokens)
            return feedback.choices[0].message.content.lower()
        except Exception as e:
            print("Error when generating feedback:", e)
            sleep(30)
            continue

In [112]:
def get_feedback_json(artigo, query, response, model = 'llama3-70b-8192', max_tokens = 1000):
    while True:
        try:
            feedback = get_feedback(artigo, query, response, model, max_tokens)
            dict = json.loads(feedback)
            dict['eval'] = int(dict['eval'])
            if dict['eval'] in [0, 1, 2, 3]:
                return dict
            else:
                raise Exception("Invalid evaluation: ", dict['eval'])
        except Exception as e:
            print("Error when parsing feedback:", e)

In [113]:
def evaluate_articles_levels(artigos, 
                      query,
                      model = 'llama3-70b-8192',
                      max_tokens = 1000,
                      verbose = True):
    """
    artigos: list of dictionaries with the following keys: 'title', 'abstract'
    query: string with the query that the articles will be evaluated against

    Returns a list of dictionaries with the following keys: 'title', 'abstract', 'eval', 
    where 'eval' is an integer from 0 to 3 where 0 means no relevance, 1 is very slightly relevant,
    2 is relevant, and 3 means completely relevant to the query    
    """

    evaluated = []
    if verbose: print("Query:", query)

    for artigo in tqdm(artigos, desc="Evaluating articles"):
        prompt = f"Read the following article, named '{artigo['title']}', with the following content: \n {artigo['abstract']} \n \
                Evaluate how relevant the article is to the following query: {query} \n"

        response = get_initial_response(prompt, model, max_tokens)

        feedback = get_feedback_json(artigo, query, response, model, max_tokens)
        
        if verbose: print(f"Article: '{artigo['title']}'\n Classification: {feedback}")
        evaluated.append({'title': artigo['title'], 'abstract': artigo['abstract'], 'eval': feedback['eval']})
    return evaluated

In [114]:
evaluated = evaluate_articles_levels(data, query)

Query: transformer-based models for optimizing ranked list truncation in information retrieval


Evaluating articles:   1%|          | 1/100 [00:01<03:04,  1.86s/it]

Article: 'Starobinsky-Bel-Robinson gravity'
 Classification: {'explanation': 'the article discusses a novel gravitational theory inspired by superstring theory, which has no apparent connection to transformer-based models or optimizing ranked list truncation in information retrieval. the topics are unrelated, and the article does not mention anything related to the query. however, the query is specific to a particular area of information retrieval, and the article is about a completely different field of research. therefore, i agree with the previous evaluation.', 'eval': 0}


Evaluating articles:   2%|▏         | 2/100 [00:03<02:59,  1.83s/it]

Article: 'Deep Convolutional Neural Networks Model-based Brain Tumor Detection in
  Brain MRI Images'
 Classification: {'explanation': 'i agree with the previous evaluation that the article is not directly related to the query about transformer-based models for optimizing ranked list truncation in information retrieval. the article discusses brain tumor detection using deep convolutional neural networks, which is a different topic in the field of medical science. however, i would rate the relevance as 1 instead of 0, as both topics share a common ground in machine learning and neural networks, although the application domains are different.', 'eval': 1}


Evaluating articles:   3%|▎         | 3/100 [00:16<11:20,  7.01s/it]

Article: 'A Theory-Based Evaluation of Nearest Neighbor Models Put Into Practice'
 Classification: {'explanation': 'i agree with the previous evaluation that the article is not directly related to transformer-based models or optimizing ranked list truncation in information retrieval. the article focuses on k-nearest neighbors models and their evaluation, which is a different topic from the query. however, i would rate the relevance as 1 instead of 0, because both topics are related to data analysis and processing, sharing a similar topic of data processing, even though the connection is not direct.', 'eval': 1}


Evaluating articles:   4%|▍         | 4/100 [00:29<14:38,  9.15s/it]

Article: 'Transfer and Share: Semi-Supervised Learning from Long-Tailed Data'
 Classification: {'explanation': 'i agree with the previous evaluation that the article is not relevant to the query. the article focuses on semi-supervised learning for long-tailed data, whereas the query is about transformer-based models for optimizing ranked list truncation in information retrieval. there is no mention of transformers, information retrieval, or ranked list truncation in the article, making it unrelated to the query.', 'eval': 0}


Evaluating articles:   5%|▌         | 5/100 [00:45<18:17, 11.55s/it]

Article: 'Biharmonic homogeneous polynomial maps between spheres'
 Classification: {'explanation': 'the article appears to be focused on mathematical concepts and proofs related to biharmonic maps and polynomial maps between spheres, whereas the query is about transformer-based models for optimizing ranked list truncation in information retrieval. there is no apparent connection between the two topics, making the article irrelevant to the query.', 'eval': 0}


Evaluating articles:   6%|▌         | 6/100 [01:03<21:39, 13.82s/it]

Article: 'Integration of Blockchain and Edge Computing in Internet of Things: A
  Survey'
 Classification: {'explanation': "i agree with the previous evaluation that the article is not directly related to the query. the article discusses the integration of blockchain and edge computing in iot applications, whereas the query is about transformer-based models for optimizing ranked list truncation in information retrieval. there is no apparent connection between the two topics. however, i wouldn't rate it a 0, as both topics are related to technology and computing, sharing a similar topic even if it's a broad and distant connection.", 'eval': 1}


Evaluating articles:   7%|▋         | 7/100 [01:17<21:48, 14.06s/it]

Article: 'Multi-fidelity power flow solver'
 Classification: {'explanation': "the article discusses a multi-fidelity neural network for power flow simulations and contingency analysis, which has no apparent connection to transformer-based models or ranked list truncation in information retrieval. the topics and domains are completely different, making the article not relevant to the query. however, i wouldn't rate it as 0 (absolutely no relevance), as both topics involve complex computational models, which is a very loose connection. hence, i rate it as 1, meaning the article is only very slightly relevant to the query.", 'eval': 1}


Evaluating articles:   8%|▊         | 8/100 [01:38<24:53, 16.24s/it]

Article: 'Automatic Detection of ECG Abnormalities by using an Ensemble of Deep
  Residual Networks with Attention'
 Classification: {'explanation': "i agree with the previous evaluation that the article is not relevant to the query about transformer-based models for optimizing ranked list truncation in information retrieval. the article is focused on using deep residual networks with attention for automatic detection of ecg abnormalities in the medical/healthcare domain, which is a completely different topic. there is no mention of transformer-based models or information retrieval in the article. however, i wouldn't rate it as a 0, as it's still a topic related to ai/ml, even if it's in a different domain. therefore, i would rate it as 1, indicating that the article is only very slightly relevant to the query.", 'eval': 1}


Evaluating articles:   9%|▉         | 9/100 [01:55<24:51, 16.39s/it]

Article: 'Determination of the $N_f=12$ step scaling function using M\"obius
  domain wall fermions'
 Classification: {'explanation': 'i concur with the previous evaluation that the article is unrelated to the query. the article focuses on particle physics and computational methods, specifically using domain wall fermions and gauge actions, whereas the query is about transformer-based models in information retrieval, which is a distinct field. there is no mention or connection between the two topics.', 'eval': 0}


Evaluating articles:  10%|█         | 10/100 [02:12<25:01, 16.68s/it]

Article: 'DDet: Dual-path Dynamic Enhancement Network for Real-World Image
  Super-Resolution'
 Classification: {'explanation': 'the article discusses a dual-path dynamic enhancement network for real-world image super-resolution, which is unrelated to the query about transformer-based models for optimizing ranked list truncation in information retrieval. the topics and techniques mentioned in the article, such as image super-resolution, convolutional blocks, and dynamic attention, are not relevant to the query. therefore, i agree with the previous evaluation.', 'eval': 0}


Evaluating articles:  11%|█         | 11/100 [02:21<21:03, 14.20s/it]

Article: 'Thermalizing two identical particles'
 Classification: {'explanation': 'i completely agree with the previous evaluation. the article discusses quantum mechanics and statistical physics, which are unrelated to transformer-based models in information retrieval. there is no apparent connection or similarity between the two topics. the article does not mention anything related to transformers, models, optimization, ranked lists, truncation, or information retrieval, which are the key concepts in the query. the topics are completely divergent.', 'eval': 0}


Evaluating articles:  12%|█▏        | 12/100 [02:31<18:58, 12.94s/it]

Article: 'Development of Transition-Edge Sensor X-ray Microcalorimeter Linear
  Array for Compton Scattering and Energy Dispersive Diffraction Imaging'
 Classification: {'explanation': 'the article is about the development of a transition-edge sensor microcalorimeter linear array for x-ray diffraction imaging and compton scattering applications, which has no apparent connection to transformer-based models or optimizing ranked list truncation in information retrieval. the topics and terminology used in the article are unrelated to the query, making it irrelevant to the search query.', 'eval': 0}


Evaluating articles:  13%|█▎        | 13/100 [02:51<22:03, 15.22s/it]

Article: 'Multiple representations of real numbers on self-similar sets with
  overlaps'
 Classification: {'explanation': 'i completely agree with the previous evaluation. the article is a mathematical paper that deals with representations of real numbers on self-similar sets with overlaps, which has no apparent connection to the query about transformer-based models for optimizing ranked list truncation in information retrieval. the topics are vastly different and there is no mention of the query-related topics in the article.', 'eval': 0}


Evaluating articles:  14%|█▍        | 14/100 [03:16<26:03, 18.18s/it]

Article: 'Lying on networks: The role of structure and topology in promoting
  honesty'
 Classification: {'explanation': 'the article discusses the dynamics of lying in networks, while the query is about transformer-based models for optimizing ranked list truncation in information retrieval. the topics are completely unrelated, and there is no mention of any of the concepts mentioned in the query in the article. therefore, the article has absolutely no relevance to the query.', 'eval': 0}


Evaluating articles:  15%|█▌        | 15/100 [03:36<26:30, 18.71s/it]

Article: 'Elevated ionizing photon production efficiency in faint
  high-equivalent-width Lyman-alpha emitters'
 Classification: {'explanation': 'i agree with the previous evaluation. the article is from the field of astrophysics and discusses topics that are unrelated to the query, which is about transformer-based models for optimizing ranked list truncation in information retrieval. there is no mention or connection to the concepts in the query, making the article irrelevant to the query.', 'eval': 0}


Evaluating articles:  16%|█▌        | 16/100 [04:00<28:21, 20.25s/it]

Article: 'Don't shoot butterfly with rifles: Multi-channel Continuous Speech
  Separation with Early Exit Transformer'
 Classification: {'explanation': 'while the article primarily discusses the application of transformers in speech separation, it does mention the modeling capacity of transformers, which could be potentially relevant to optimizing ranked list truncation in information retrieval. however, the connection is still quite distant, and the article does not directly address the topic of the query.', 'eval': 1}


Evaluating articles:  17%|█▋        | 17/100 [04:18<26:59, 19.52s/it]

Article: 'Unpredictable repeatability in molecular evolution'
 Classification: {'explanation': "i agree with the previous evaluation that the article is unrelated to the query. the article discusses molecular evolution, genotypic level, and fitness effects, which have no connection to transformer-based models or optimizing ranked list truncation in information retrieval. the topics are fundamentally different, and the article does not mention anything related to the query. the article's content is focused on biological and evolutionary concepts, while the query is about information retrieval and transformer-based models. there is no overlap or similarity between the two.", 'eval': 0}


Evaluating articles:  18%|█▊        | 18/100 [04:26<22:07, 16.19s/it]

Article: 'Simplex-averaged finite element methods for $H({\rm grad})$, $H({\rm
  curl})$ and $H({\rm div})$ convection-diffusion problems'
 Classification: {'explanation': 'the article is about finite element methods for convection-diffusion problems, which is a completely different field from information retrieval and transformer-based models. the query is about optimizing ranked list truncation in information retrieval, which is unrelated to the topic of the article. therefore, i agree with the previous evaluation that the article has absolutely no relevance to the query.', 'eval': 0}


Evaluating articles:  19%|█▉        | 19/100 [04:44<22:23, 16.58s/it]

Article: 'Fourier transform detection of weak optical transitions with cyclic
  routines'
 Classification: {'explanation': "i agree with the previous evaluation that the article is not directly related to transformer-based models or information retrieval. however, i think the previous evaluation is too harsh. the article does mention the fourier transform, which is a mathematical concept that has connections to signal processing and analysis. while it's true that the article's application is in a completely different field, the fourier transform itself could be seen as a tangential connection to the query. therefore, i would rate the relevance as 1, indicating a very slight relevance.", 'eval': 1}


Evaluating articles:  20%|██        | 20/100 [05:01<22:15, 16.69s/it]

Article: 'sBSNN: Stochastic-Bits Enabled Binary Spiking Neural Network with
  On-Chip Learning for Energy Efficient Neuromorphic Computing at the Edge'
 Classification: {'explanation': 'i agree with the previous evaluation that the article is not directly related to the query about transformer-based models for optimizing ranked list truncation in information retrieval. the article discusses a specific type of neural network architecture (sbsnn) and its application to image recognition tasks, which is unrelated to the topic of transformer-based models and ranked list truncation in information retrieval. however, both articles deal with neural networks and computing, which share a similar topic. therefore, i would rate this article a 1, as it is only very slightly relevant to the query.', 'eval': 1}


Evaluating articles:  21%|██        | 21/100 [05:15<20:45, 15.77s/it]

Article: 'Which Generation Shows the Most Prudent Data Sharing Behaviour?'
 Classification: {'explanation': 'i agree with the previous evaluation that the article is not directly related to the query about transformer-based models for optimizing ranked list truncation in information retrieval. the article is about a study on data sharing behavior and attitudes among different age groups, which is a completely different topic. however, i would rate the relevance as 1 instead of 0, as both topics are related to data and information, and the article does touch on data sharing behavior, which shares a similar theme with the query. however, the connection is very weak and the article does not provide any insights or relevance to the specific query.', 'eval': 1}


Evaluating articles:  22%|██▏       | 22/100 [05:31<20:39, 15.89s/it]

Article: 'A New Charter of Ethics and Rights of Artificial Consciousness in a
  Human World'
 Classification: {'explanation': 'i agree with the previous evaluation. the article discusses artificial consciousness, ethics, and rights, which is unrelated to transformer-based models and information retrieval. there is no mention of these topics in the article, and the query is not even tangentially related to the content.', 'eval': 0}


Evaluating articles:  23%|██▎       | 23/100 [05:47<20:24, 15.91s/it]

Article: 'X-ray measurement model incorporating energy-correlated material
  variability and its application in information-theoretic system analysis'
 Classification: {'explanation': "i agree with the previous evaluation that the topics of the article and the query are unrelated. the article focuses on x-ray measurement models and their application in analyzing x-ray imaging and sensing systems, while the query is about transformer-based models for optimizing ranked list truncation in information retrieval. there is no mention of transformers, ranked list truncation, or information retrieval in the article. however, i would rate the relevance as 1 instead of 0, since both topics share a common theme of 'analysis' and 'performance optimization', albeit in different domains.", 'eval': 1}


Evaluating articles:  24%|██▍       | 24/100 [05:57<18:12, 14.38s/it]

Article: 'Superconductor-metal quantum transition at the EuO-KTaO3 interface'
 Classification: {'explanation': 'i agree with the previous evaluation. the article discusses superconductivity and quantum physics, with no mention of transformer-based models, information retrieval, or ranked list truncation. the topics are completely unrelated, and there is no connection between the article and the query.', 'eval': 0}


Evaluating articles:  25%|██▌       | 25/100 [06:21<21:22, 17.10s/it]

Article: 'Efficient Inverse-Free Incremental and Decremental Algorithms for
  Multiple Hidden Nodes in Extreme Learning Machine'
 Classification: {'explanation': 'i completely agree with the previous evaluation. the article discusses extreme learning machine (elm) and its variants, which is a type of neural network, whereas the query mentions transformer-based models for optimizing ranked list truncation in information retrieval. the two topics seem to be unrelated, and there is no mention of transformers, information retrieval, or ranked list truncation in the article. therefore, i concur that the article has absolutely no relevance to the query.', 'eval': 0}


Evaluating articles:  26%|██▌       | 26/100 [06:47<24:19, 19.72s/it]

Article: 'Fingerprints of giant planets in the composition of solar twins'
 Classification: {'explanation': 'i agree with the previous evaluation. the article is discussing planetary formation and astrobiology, which is a completely unrelated topic to the query that is about transformer-based models for optimizing ranked list truncation in information retrieval, which is a topic in the field of computer science and natural language processing. there is no connection or similarity between the two topics, making the article irrelevant to the query.', 'eval': 0}


Evaluating articles:  27%|██▋       | 27/100 [07:05<23:30, 19.32s/it]

Article: 'Few-Shot Adaptation of Generative Adversarial Networks'
 Classification: {'explanation': "i agree with the previous evaluation that the article is not relevant to the query. the article discusses adapting generative adversarial networks (gans) for few-shot image synthesis, which is unrelated to the query about transformer-based models for optimizing ranked list truncation in information retrieval. there is no mention of transformers, ranked list truncation, or information retrieval in the article. however, i would rate the article's relevance as 1 instead of 0, as both topics belong to the broader field of artificial intelligence and machine learning, sharing a similar theme.", 'eval': 1}
Error when parsing feedback: Expecting value: line 1 column 1 (char 0)


Evaluating articles:  28%|██▊       | 28/100 [07:28<24:30, 20.42s/it]

Article: 'Lamina-specific neuronal properties promote robust, stable signal
  propagation in feedforward networks'
 Classification: {'explanation': "while the article is indeed focused on neural networks in the context of neuroscience, and the query appears to be unrelated, i disagree with the previous evaluation of 0. the article does mention 'information transmission' and 'information processing', which are concepts that are also relevant in the context of natural language processing and computer science. although the connection is tenuous, it's not entirely non-existent. therefore, i would rate the relevance of this article as 1, indicating that the article is only very slightly relevant to the query, sharing at most a similar topic.", 'eval': 1}


Evaluating articles:  29%|██▉       | 29/100 [07:54<25:58, 21.95s/it]

Article: 'BCFT entanglement entropy at large central charge and the black hole
  interior'
 Classification: {'explanation': 'i agree with the previous evaluation. the article is discussing concepts in theoretical physics, such as entanglement entropy, boundary conformal field theory, and black hole physics, which are unrelated to transformer-based models for optimizing ranked list truncation in information retrieval. the topics, terminology, and methods used in the article are completely distinct from the query, indicating a complete lack of relevance.', 'eval': 0}
Error when parsing feedback: Expecting value: line 1 column 1 (char 0)


Evaluating articles:  30%|███       | 30/100 [08:13<24:45, 21.22s/it]

Article: 'Longitudinal tension and mechanical stability of a pressurized straw
  tube'
 Classification: {'explanation': "i agree with the previous evaluation that the article is not directly related to transformer-based models or optimization of ranked list truncation in information retrieval. the article discusses straw tubes, mechanical properties, and particle detectors, which seems unrelated to the query. however, i wouldn't rate it as 0, since the article still shares a common theme of scientific methodology and research, which could be considered as slightly relevant. hence, i would rate it as 1, indicating that the article is only very slightly relevant to the query.", 'eval': 1}


Evaluating articles:  31%|███       | 31/100 [08:30<22:54, 19.93s/it]

Article: 'MeshAdv: Adversarial Meshes for Visual Recognition'
 Classification: {'explanation': "i agree with the previous evaluation that the article is not directly related to the query about transformer-based models for optimizing ranked list truncation in information retrieval. the article focuses on adversarial meshes and 3d shape manipulation for attacking deep neural networks, which is a distinct topic from the query. however, i wouldn't rate it as 0 because the article does mention deep neural networks, which are related to transformer-based models. although the connection is weak, it's not entirely absent.", 'eval': 1}


Evaluating articles:  32%|███▏      | 32/100 [08:53<23:39, 20.87s/it]

Article: 'Automatic Segmentation, Feature Extraction and Comparison of Healthy and
  Stroke Cerebral Vasculature'
 Classification: {'explanation': "i agree with the previous evaluation. the article discusses a method for automated segmentation and feature extraction of cerebral vasculature, which is a topic unrelated to the query about transformer-based models for optimizing ranked list truncation in information retrieval. there is no overlap or connection between the two topics, and the article does not mention any of the keywords from the query. while the article's methodology might be interesting from a general computer science perspective, it has no direct relevance to the query.", 'eval': 0}


Evaluating articles:  33%|███▎      | 33/100 [09:21<25:40, 23.00s/it]

Article: 'How Phonotactics Affect Multilingual and Zero-shot ASR Performance'
 Classification: {'explanation': 'i agree with the previous evaluation that the topics of the article and the query are unrelated. the article focuses on automatic speech recognition and phonotactics, while the query is about transformer-based models for optimizing ranked list truncation in information retrieval. there is no mention of information retrieval, ranked list truncation, or optimization in the article, making it irrelevant to the query.', 'eval': 0}


Evaluating articles:  34%|███▍      | 34/100 [09:29<20:09, 18.33s/it]

Article: 'Constraining annihilating dark matter by radio continuum spectrum of the
  Large Magellanic Cloud'
 Classification: {'explanation': 'the article discusses dark matter annihilation signals in the large magellanic cloud, which is a topic in astrophysics. the query is about transformer-based models for optimizing ranked list truncation in information retrieval, which is a topic in natural language processing and information retrieval. the two topics are completely unrelated, and the article does not mention anything related to the query. therefore, i agree with the previous evaluation that the article is not relevant to the query.', 'eval': 0}


Evaluating articles:  35%|███▌      | 35/100 [09:51<21:05, 19.47s/it]

Article: 'Contrastive Learning with Adversarial Examples'
 Classification: {'explanation': 'i agree with the previous evaluation that the article is not directly relevant to the query about transformer-based models for optimizing ranked list truncation in information retrieval. the article focuses on contrastive learning and self-supervised learning in computer vision, which is a distinct topic from the query. however, i would rate the relevance as 1 instead of 0 because both topics are related to machine learning and share some general concepts, such as deep learning and optimization. this shared context creates a slight connection between the two, even if they are not directly related.', 'eval': 1}


Evaluating articles:  36%|███▌      | 36/100 [10:07<19:41, 18.46s/it]

Article: 'DeeBERT: Dynamic Early Exiting for Accelerating BERT Inference'
 Classification: {'explanation': "i agree with the previous evaluation that the article is relevant but not entirely relevant to the query. the article discusses optimizing transformer-based models, specifically bert, which aligns with the query's topic. however, the article's focus is on accelerating bert inference in general, rather than specifically on ranked list truncation in information retrieval. while there is a connection between the article's topic and the query, the specific application mentioned in the query is not the main focus of the article.", 'eval': 2}


Evaluating articles:  37%|███▋      | 37/100 [10:26<19:32, 18.61s/it]

Article: 'Listening for Sirens: Locating and Classifying Acoustic Alarms in City
  Scenes'
 Classification: {'explanation': 'the article is about acoustic event detection and sound source localization in an urban scenario, specifically focusing on identifying and locating horns and sirens of emergency vehicles. it has no relation to transformer-based models or optimizing ranked list truncation in information retrieval, which are concepts related to natural language processing and information retrieval. the content of the article and the query are unrelated, but they both involve processing and analysis of signals, albeit different types (acoustic vs. textual). this faint connection justifies a relevance level of 1.', 'eval': 1}


Evaluating articles:  38%|███▊      | 38/100 [10:36<16:38, 16.10s/it]

Article: 'Transient chaotic dimensionality expansion by recurrent networks'
 Classification: {'explanation': "i agree with the previous evaluation that the article is not directly related to transformer-based models or optimizing ranked list truncation in information retrieval. the article discusses neural networks and chaos theory, which seem to be unrelated to the query. however, as the article is about neural networks, which are a fundamental concept in ai and machine learning, i wouldn't rate it a 0, since it's possible that some future research could explore the application of chaos theory in neural networks to optimization tasks in information retrieval. hence, i would rate it a 1, indicating that the article is only very slightly relevant to the query.", 'eval': 1}
Error when parsing feedback: Expecting value: line 1 column 1 (char 0)


Evaluating articles:  39%|███▉      | 39/100 [11:03<19:35, 19.27s/it]

Article: 'Ergodic Achievable Rate Maximization of RIS-assisted Millimeter-Wave
  MIMO-OFDM Communication Systems'
 Classification: {'explanation': 'i agree with the previous evaluation that the article is completely unrelated to the query, which is about transformer-based models for optimizing ranked list truncation in information retrieval. the article discusses reconfigurable intelligent surface (ris) assisted millimeter-wave mimo-ofdm communication systems, which is a topic in wireless communication, whereas the query is in the domain of information retrieval. there is no mention of transformers, ranked list truncation, or information retrieval in the article, making it irrelevant to the query.', 'eval': 0}


Evaluating articles:  40%|████      | 40/100 [11:12<16:26, 16.44s/it]

Article: 'DeFuzz: Deep Learning Guided Directed Fuzzing'
 Classification: {'explanation': 'i agree with the previous evaluation that the article is not directly related to the query. the article focuses on deep learning guided fuzzing for software vulnerability detection, while the query is about transformer-based models for optimizing ranked list truncation in information retrieval. although both topics involve deep learning, the application domains and specific topics are distinct. however, i would argue that the article is slightly more relevant than a complete mismatch, as it demonstrates the application of deep learning in a different domain. therefore, i would rate the relevance as 1.', 'eval': 1}


Evaluating articles:  41%|████      | 41/100 [11:28<15:45, 16.02s/it]

Article: 'Inherently stable effective field theory for dark energy and modified
  gravity'
 Classification: {'explanation': 'i agree with the previous evaluation that the article is completely unrelated to the query, which is about transformer-based models for optimizing ranked list truncation in information retrieval. the article is focused on cosmology and theoretical physics, discussing effective field theory for dark energy and modified gravity. there is no apparent connection or overlap between the two topics. while the article is well-written and discusses a specific area of research, it is not relevant to the query.', 'eval': 0}


Evaluating articles:  42%|████▏     | 42/100 [11:35<12:59, 13.43s/it]

Article: 'On complexity of representations of quivers'
 Classification: {'explanation': 'i agree with the previous evaluation that the article has no connection to transformer-based models or information retrieval, which are the main topics of the query. the article is focused on algebraic representations and quivers, which is a completely different field of study. there is no mention of machine learning, natural language processing, or information retrieval in the article. therefore, i concur that the relevance of this article to the query is very low.', 'eval': 0}


Evaluating articles:  43%|████▎     | 43/100 [11:46<12:11, 12.83s/it]

Article: 'Quantum Formation of Primordial Black holes'
 Classification: {'explanation': 'the article is about quantum mechanics and primordial black holes, which has no relation to transformer-based models or ranked list truncation in information retrieval. the topics are completely different and unrelated, making the article not relevant to the query.', 'eval': 0}


Evaluating articles:  44%|████▍     | 44/100 [12:08<14:28, 15.51s/it]

Article: 'Tree Reconstruction using Topology Optimisation'
 Classification: {'explanation': 'i agree with the previous evaluation. the article focuses on tree reconstruction using topology optimization, which is unrelated to transformer-based models and optimizing ranked list truncation in information retrieval. the topics, keywords, and concepts discussed in the article do not overlap with the query, making it irrelevant to the query.', 'eval': 0}


Evaluating articles:  45%|████▌     | 45/100 [12:20<13:21, 14.58s/it]

Article: 'Deep Learning for Ultra-Reliable and Low-Latency Communications in 6G
  Networks'
 Classification: {'explanation': 'i completely agree with the previous evaluation. the article focuses on the application of deep learning techniques in 6g networks, specifically urllc, with no mention of transformer-based models, ranked list truncation, or information retrieval, which are the key concepts in the query. the topics are indeed unrelated, making the article not relevant to the query.', 'eval': 0}


Evaluating articles:  46%|████▌     | 46/100 [12:45<15:53, 17.65s/it]

Article: 'Active galactic nuclei ghosts: A systematic search for faded nuclei'
 Classification: {'explanation': "the article is about active galactic nuclei and their evolution, discussing the fading and rising of their activity. it is unrelated to the topic of transformer-based models for optimizing ranked list truncation in information retrieval. the content is about astrophysics, and there is no connection to the query. however, i wouldn't rate it as 0 because it's still a research article discussing a scientific topic, and in a very broad sense, it shares a similar general topic of scientific research with the query. but it's still very far from being relevant to the query.", 'eval': 1}
Error when parsing feedback: Expecting value: line 1 column 1 (char 0)


Evaluating articles:  47%|████▋     | 47/100 [13:08<16:55, 19.16s/it]

Article: 'Nonbinary Error-Detecting Hybrid Codes'
 Classification: {'explanation': "i agree with the previous evaluation. the article discusses quantum computing and coding theory, which is unrelated to transformer-based models and ranked list truncation in information retrieval. the topics are distinct and do not share any apparent connections. while the article does mention 'information' in the context of classical information transmission, it is not related to the 'information retrieval' mentioned in the query. therefore, i concur that the article has no relevance to the query.", 'eval': 0}


Evaluating articles:  48%|████▊     | 48/100 [13:25<16:05, 18.57s/it]

Article: 'Interactive Movement Primitives: Planning to Push Occluding Pieces for
  Fruit Picking'
 Classification: {'explanation': 'i agree with the previous evaluation that the article and the query are unrelated. the article focuses on robotic technology and fruit picking, while the query is about transformer-based models for optimizing ranked list truncation in information retrieval. there is no overlap or similarity between the two topics. the article does not mention transformers, ranked list truncation, or information retrieval in any way. therefore, i conclude that the article is not relevant to the query.', 'eval': 0}


Evaluating articles:  49%|████▉     | 49/100 [13:49<17:03, 20.07s/it]

Article: 'Pb-doped p-type Bi$_2$Se$_3$ thin films via interfacial engineering'
 Classification: {'explanation': 'the article is about pb-doped p-type bi2se3 thin films and its properties, which has no connection to transformer-based models or optimizing ranked list truncation in information retrieval. the topics are completely unrelated, making the article irrelevant to the query.', 'eval': 0}


Evaluating articles:  50%|█████     | 50/100 [14:05<15:38, 18.78s/it]

Article: 'Growth of nonsymmetric operads'
 Classification: {'explanation': 'i agree with the previous evaluation. the article is about nonsymmetric operads, a mathematical concept, and has no connection to transformer-based models or information retrieval, which are topics in computer science and natural language processing. the content of the article does not share any similarities with the query, making it completely irrelevant.', 'eval': 0}


Evaluating articles:  51%|█████     | 51/100 [14:25<15:49, 19.38s/it]

Article: 'Optimizing Electric Multiple Unit Circulation Plan within Maintenance
  Constraints for High-Speed Railway System'
 Classification: {'explanation': 'i agree with the previous evaluation that the article is not directly related to the query. the article focuses on optimizing emu circulation plans for high-speed railways, which is unrelated to transformer-based models for optimizing ranked list truncation in information retrieval. while both topics involve optimization, the domains and techniques used are completely different. however, i would rate it as 1 instead of 0 because the article does involve optimization, which shares a slight connection with the query.', 'eval': 1}
Error when parsing feedback: Expecting value: line 1 column 1 (char 0)


Evaluating articles:  52%|█████▏    | 52/100 [14:55<17:58, 22.46s/it]

Article: 'Near-field imaging of surface-plasmon vortex-modes around a single
  elliptical nanohole in a gold film'
 Classification: {'explanation': 'i agree with the previous evaluation that the article is not related to the query about transformer-based models for optimizing ranked list truncation in information retrieval. the article is focused on surface plasmon modes and nanoholes in a gold film, which is a completely different field of study. the language, concepts, and techniques used in the article are distinct from those in the query, indicating a lack of relevance. however, i would rate the relevance as 1 instead of 0, as the article is still a scientific/academic paper, and there might be some general, high-level connections between the two fields, such as the use of mathematical models or computational methods. but these connections are too vague and indirect to imply any significant relevance.', 'eval': 1}


Evaluating articles:  53%|█████▎    | 53/100 [15:05<14:34, 18.61s/it]

Article: 'Driven translocation of a semiflexible polymer through a conical channel
  in the presence of attractive surface interactions'
 Classification: {'explanation': "the article is about the translocation of a semiflexible polymer through a conical channel, which has no apparent connection to transformer-based models or optimizing ranked list truncation in information retrieval. the topics and fields of study are completely unrelated, making it difficult to find any relevance between the two. however, i wouldn't classify it as a 0 since the article does touch on concepts like dynamics and optimization, albeit in a completely different context. therefore, i would evaluate the article's relevance to the query as 1.", 'eval': 1}


Evaluating articles:  54%|█████▍    | 54/100 [15:17<12:56, 16.87s/it]

Article: 'The Accuracy of Restricted Boltzmann Machine Models of Ising Systems'
 Classification: {'explanation': "i agree with the previous evaluation that the article is not related to the query. the article focuses on restricted boltzmann machine models of ising systems, which is a topic in statistical physics, whereas the query is about transformer-based models for optimizing ranked list truncation in information retrieval, which is a topic in natural language processing. there is no overlap between the content of the article and the query. however, i wouldn't rate it as 0 because the article is still a machine learning/modeling topic, albeit in a different domain. therefore, i would rate it as 1, indicating that the article shares a similar topic (machine learning/models) but is not relevant to the query.", 'eval': 1}
Error when parsing feedback: Expecting value: line 1 column 1 (char 0)


Evaluating articles:  55%|█████▌    | 55/100 [15:44<14:45, 19.69s/it]

Article: 'See saw mechanism with Yukawa alignment for neutrinos'
 Classification: {'explanation': 'i concur with the previous evaluation that the article is unrelated to the query, which focuses on transformer-based models for optimizing ranked list truncation in information retrieval. the article, on the other hand, discusses a seesaw mechanism with yukawa alignment for neutrinos, which is a topic in particle physics. there is no apparent connection between the two, and the technical terms and concepts used in the article are not related to the query. the relevance is therefore very low.', 'eval': 0}


Evaluating articles:  56%|█████▌    | 56/100 [16:03<14:15, 19.44s/it]

Article: 'Game Values of Strong Placement Games'
 Classification: {'explanation': 'i agree with the previous evaluation that the article is unrelated to the query about transformer-based models for optimizing ranked list truncation in information retrieval. the article discusses game theory and simplicial complexes, which are far removed from the topics of natural language processing and information retrieval. there is no apparent connection between the two topics, and the language and concepts used in the article are not relevant to the query. however, i would rate this article a 1 instead of 0, as it shares a similar topic in the sense that both game theory and information retrieval involve abstract structures and mathematical concepts, even if they are not directly related.', 'eval': 1}


Evaluating articles:  57%|█████▋    | 57/100 [16:14<12:17, 17.16s/it]

Article: 'On the centralizer of vector fields: criteria of triviality and
  genericity results'
 Classification: {'explanation': 'the article is about vector fields and riemannian manifolds, which is a completely different topic from transformer-based models and ranked list truncation in information retrieval. there is no mention of transformers, information retrieval, or ranked lists in the article. the previous evaluation of 0 is correct, as the article is not relevant to the query at all.', 'eval': 0}


Evaluating articles:  58%|█████▊    | 58/100 [16:40<13:51, 19.79s/it]

Article: 'Attacks Which Do Not Kill Training Make Adversarial Learning Stronger'
 Classification: {'explanation': "i agree with the previous evaluation that the article is not directly related to the query topics of transformer-based models, optimizing ranked list truncation, or information retrieval. the article focuses on adversarial training and robustness in machine learning, which seems to be a different domain. however, i wouldn't say the article has absolutely no relevance, as both topics are related to machine learning and optimization techniques. therefore, i would rate the relevance as 1, indicating a slight relevance due to the shared domain of machine learning.", 'eval': 1}


Evaluating articles:  59%|█████▉    | 59/100 [17:05<14:34, 21.32s/it]

Article: 'SymNMF-Net for The Symmetric NMF Problem'
 Classification: {'explanation': "i agree with the previous evaluation. the article is about symmetric non-negative matrix factorization (symnmf) and proposes a neural network called symnmf-net to solve the symnmf problem, which has no relation to transformer-based models, ranked list truncation, or information retrieval. the topics are completely different, and there is no mention of the query's keywords in the article.", 'eval': 0}


Evaluating articles:  60%|██████    | 60/100 [17:22<13:14, 19.87s/it]

Article: 'Vibrational Heat-Bath Configuration Interaction'
 Classification: {'explanation': "i completely agree with the previous evaluation. the article discusses a method for calculating vibrational eigenstates in anharmonic systems, which is a topic in physics or chemistry, whereas the query is about transformer-based models for optimizing ranked list truncation in information retrieval, which is a topic in natural language processing and information retrieval. there is no connection between the two topics, and the article does not mention any of the keywords from the query. the article's content is completely unrelated to the query.", 'eval': 0}


Evaluating articles:  61%|██████    | 61/100 [17:37<12:07, 18.64s/it]

Article: 'A unified view of space-time covariance functions through Gelfand pairs'
 Classification: {'explanation': 'i agree with the previous evaluation. the article discusses gelfand pairs and their application to spatio-temporal statistics, which has no apparent connection to transformer-based models, ranked list truncation, or information retrieval. the topics are completely unrelated, and the article does not mention any relevant keywords related to the query.', 'eval': 0}


Evaluating articles:  62%|██████▏   | 62/100 [17:50<10:35, 16.72s/it]

Article: 'Grasping as Inference: Reactive Grasping in Heavily Cluttered
  Environment'
 Classification: {'explanation': 'i agree with the previous evaluation that the article is not relevant to the query. the article discusses grasping and robotics, which is a completely different topic from transformer-based models for optimizing ranked list truncation in information retrieval. there is no mention of transformers, natural language processing, or information retrieval in the article. therefore, the article has absolutely no relevance to the query.', 'eval': 0}


Evaluating articles:  63%|██████▎   | 63/100 [18:08<10:37, 17.24s/it]

Article: 'The Case for Learning Application Behavior to Improve Hardware Energy
  Efficiency'
 Classification: {'explanation': 'i partially agree with the previous evaluation. although the topics seem different at first glance, both the article and the query are related to the field of computer science and involve the use of deep learning models. however, the specific applications and goals are distinct, and there is no direct connection between optimizing hardware energy efficiency and ranked list truncation in information retrieval. therefore, i would rate the relevance as 1, indicating that the article is only slightly relevant to the query, sharing a similar topic but not directly related.', 'eval': 1}


Evaluating articles:  64%|██████▍   | 64/100 [18:22<09:46, 16.29s/it]

Article: 'Cost-Optimal Laser-Accelerated Lightsails'
 Classification: {'explanation': 'i completely agree with the previous evaluation. the article discusses laser-accelerated lightsails and their applications in space missions, which is entirely unrelated to the query about transformer-based models for optimizing ranked list truncation in information retrieval. there is no mention of transformers, models, optimization, or information retrieval in the article, and the content of the article has no connection to the query. the topics are completely disparate, and the article does not provide any relevant information or insights that could be applicable to the query.', 'eval': 0}


Evaluating articles:  65%|██████▌   | 65/100 [18:44<10:26, 17.89s/it]

Article: 'Nonreciprocal directional dichroism induced by a temperature gradient as
  a probe for mobile spin dynamics in quantum magnets'
 Classification: {'explanation': "the article is about quantum magnets and experimental probes, which is unrelated to transformer-based models for optimizing ranked list truncation in information retrieval. the topics are completely different, and there is no mention of transformers, ranked lists, or information retrieval in the article. however, i wouldn't say it has 'absolutely no relevance' since both topics are related to scientific research, so i'll give it a 1.", 'eval': 1}


Evaluating articles:  66%|██████▌   | 66/100 [19:06<10:50, 19.15s/it]

Article: 'A broadband achromatic polarization-insensitive metalens consisting of
  anisotropic nanostructures'
 Classification: {'explanation': 'i agree with the previous evaluation that the article has absolutely no relevance to the query. the article discusses metasurfaces, metalenses, and optical devices, which are unrelated to the topic of transformer-based models for optimizing ranked list truncation in information retrieval. the two subjects belong to different fields, namely optics and natural language processing, with no overlap or similarity. therefore, the article has no relevance to the query.', 'eval': 0}


Evaluating articles:  67%|██████▋   | 67/100 [19:26<10:36, 19.28s/it]

Article: 'Asymptotic Expansions of The Traces of the Thermoelastic Operators'
 Classification: {'explanation': 'the article is about asymptotic expansions of thermoelastic operators in riemannian manifolds, which is a topic in mathematics and physics that has no apparent connection to transformer-based models or information retrieval. the query is about optimizing ranked list truncation in information retrieval using transformer-based models, which is a topic in natural language processing and machine learning. there is no shared topic or keyword between the article and the query, making the article irrelevant to the query.', 'eval': 0}


Evaluating articles:  68%|██████▊   | 68/100 [19:42<09:51, 18.49s/it]

Article: 'On Eventually Periodic Sets as Minimal Additive Complements'
 Classification: {'explanation': 'the article discusses additive complements in abelian groups, specifically focusing on eventually periodic sets, which is a topic in abstract algebra. the query, on the other hand, is about transformer-based models for optimizing ranked list truncation in information retrieval, which is a topic in artificial intelligence and natural language processing. these two topics are unrelated, and there is no connection between the concepts discussed in the article and the query. therefore, i agree with the previous evaluation.', 'eval': 0}


Evaluating articles:  69%|██████▉   | 69/100 [20:03<09:53, 19.14s/it]

Article: 'Two-phonon structures for beta-decay theory'
 Classification: {'explanation': 'i agree with the previous evaluation of 0 because the article is completely unrelated to the query. the article discusses beta-decay theory and nuclear physics, while the query is about transformer-based models for optimizing ranked list truncation in information retrieval. there is no mention of transformers, information retrieval, or ranked list truncation in the article, and the concepts discussed are entirely different from the query.', 'eval': 0}


Evaluating articles:  70%|███████   | 70/100 [20:17<08:45, 17.52s/it]

Article: 'Symbiotic Child Emotional Support with Social Robots and Temporal
  Knowledge Graphs'
 Classification: {'explanation': "the article discusses the development of a symbiotic framework for real-time emotional support with social robots and knowledge graphs, which has no apparent connection to the query about transformer-based models for optimizing ranked list truncation in information retrieval. the topics are unrelated, and the article does not mention anything about information retrieval or transformer-based models. however, since the article is focused on a specific application of ai in child emotional support, i wouldn't rate it as a 0 because it still shares a very general connection to ai and machine learning, which might be marginally related to the query. therefore, i would rate it as a 1, indicating very slight relevance.", 'eval': 1}


Evaluating articles:  71%|███████   | 71/100 [20:29<07:39, 15.86s/it]

Article: 'High Tc superconductivity in heavy Rare Earth Hydrides: correlation
  between the presence of the f states on the Fermi surface, nesting and the
  value of Tc'
 Classification: {'explanation': 'i agree with the previous evaluation that the article has no relevance to the query. the article is about superconductivity in rare earth hydrides, which is a topic in materials science, whereas the query is about transformer-based models for optimizing ranked list truncation in information retrieval, which is a topic in natural language processing and information retrieval. there is no overlap or connection between the two topics, making the article completely irrelevant to the query.', 'eval': 0}


Evaluating articles:  72%|███████▏  | 72/100 [20:40<06:43, 14.40s/it]

Article: 'Diffusion in the presence of correlated dynamical disorder and coherent
  exciton transfer in the non-Markovian limit'
 Classification: {'explanation': 'the article is not related to transformer-based models or optimizing ranked list truncation in information retrieval, which are topics in natural language processing and information retrieval. the article is focused on quantum systems, hamiltonian, and quantum coherence, which are concepts from physics. therefore, i agree that the article has no relevance to the query.', 'eval': 0}


Evaluating articles:  73%|███████▎  | 73/100 [21:00<07:14, 16.10s/it]

Article: 'Continuous-time multi-state capture-recapture models'
 Classification: {'explanation': "i agree with the previous evaluation that the article is not relevant to the query. the article is about continuous-time multi-state capture-recapture models, which is a topic in statistics and biology, whereas the query is about transformer-based models for optimizing ranked list truncation in information retrieval, which is a topic in natural language processing and computer science. there is no connection or similarity between the two topics, making the article irrelevant to the query. however, i wouldn't rate it as 0 because the article does contain some technical terms and concepts that could be potentially related to optimization techniques, although in a very indirect way. therefore, i would rate the relevance as 1, indicating that the article is only very slightly relevant to the query, sharing at most a similar topic.", 'eval': 1}


Evaluating articles:  74%|███████▍  | 74/100 [21:17<07:12, 16.63s/it]

Article: 'A panoramic landscape of the Sagittarius stream in Gaia DR2 revealed
  with the STREAMFINDER spyglass'
 Classification: {'explanation': 'i agree with the previous evaluation that the article is completely unrelated to the query. the article discusses astronomy and the sagittarius stream, while the query is about transformer-based models for optimizing ranked list truncation in information retrieval. there is no connection between the two topics, making the article irrelevant to the query.', 'eval': 0}


Evaluating articles:  75%|███████▌  | 75/100 [21:34<06:51, 16.47s/it]

Article: 'Application of the iterative reconstruction to simulated galaxy fields'
 Classification: {'explanation': 'the article discusses the application of an iterative reconstruction method to galaxy mocks in redshift space, which has no direct relation to transformer-based models or optimizing ranked list truncation in information retrieval. the topics and fields studied are completely different, with the article focusing on astrophysics and galaxy simulations, while the query is related to natural language processing and information retrieval. although both topics involve computational methods, there is no conceptual overlap or connection between the two.', 'eval': 0}
Error when parsing feedback: Expecting value: line 1 column 1 (char 0)


Evaluating articles:  76%|███████▌  | 76/100 [22:01<07:54, 19.75s/it]

Article: 'Model Watermarking for Image Processing Networks'
 Classification: {'explanation': "i agree with the previous evaluation that the article is not directly related to transformer-based models or ranked list truncation in information retrieval. however, i would argue that the article's focus on deep learning models and their protection could be remotely relevant to the query, especially since it discusses model intellectual property protection, which might be tangentially related to models used in information retrieval. therefore, i would rate the relevance as 1, indicating a slight connection but not a direct relevance.", 'eval': 1}


Evaluating articles:  77%|███████▋  | 77/100 [22:19<07:25, 19.36s/it]

Article: 'Numerical approximation of elliptic problems with log-normal random
  coefficients'
 Classification: {'explanation': 'i agree with the previous evaluation that the article is not relevant to the query. the article discusses numerical approximation of elliptic problems with log-normal random coefficients, which is a completely different topic from transformer-based models for optimizing ranked list truncation in information retrieval. there is no connection or similarity between the two topics. the article does not mention transformers, optimization, ranked lists, truncation, or information retrieval at all.', 'eval': 0}


Evaluating articles:  78%|███████▊  | 78/100 [22:29<06:01, 16.43s/it]

Article: 'A search for cosmological anisotropy using the Lyman alpha forest from
  SDSS quasar spectra'
 Classification: {'explanation': "the article is about cosmological anisotropy and the lyman alpha forest, while the query is about transformer-based models for optimizing ranked list truncation in information retrieval. the topics are unrelated, but they both fall under the broad category of data analysis. since the article doesn't mention anything about machine learning, transformers, or information retrieval, i agree with the previous evaluation that the article is not relevant to the query. however, i wouldn't say it has absolutely no relevance, as both topics involve data analysis and interpretation. hence, i would give a slightly higher evaluation.", 'eval': 1}


Evaluating articles:  79%|███████▉  | 79/100 [22:47<05:54, 16.87s/it]

Article: 'An Inertial Block Majorization Minimization Framework for Nonsmooth
  Nonconvex Optimization'
 Classification: {'explanation': 'i agree with the previous evaluation. the article discusses a novel framework for nonsmooth nonconvex optimization problems, which is unrelated to transformer-based models for optimizing ranked list truncation in information retrieval. the topics seem to be from different domains, and the article does not mention key terms from the query such as transformers, information retrieval, or ranked list truncation. however, i would rate the relevance as 1 instead of 0, as both topics share a connection to machine learning and optimization, albeit in different contexts.', 'eval': 1}


Evaluating articles:  80%|████████  | 80/100 [22:53<04:34, 13.73s/it]

Article: 'Big Quantum cohomology of orbifold spheres'
 Classification: {'explanation': "the article is about constructing a kodaira-spencer map in the context of algebraic geometry, which has no apparent connection to transformer-based models or information retrieval. the topics discussed are unrelated, and the query terms do not appear in the article. however, it's clear that the article is discussing a specific mathematical concept, and it's not entirely impossible that some future research could bridge the gap between this topic and information retrieval. hence, i don't evaluate it as 0, but rather as a very low relevance.", 'eval': 1}


Evaluating articles:  81%|████████  | 81/100 [23:05<04:10, 13.19s/it]

Article: 'Synchrotron radiation from a charge circulating around a cylinder with
  negative permittivity'
 Classification: {'explanation': 'i agree with the previous evaluation. the article is focused on electromagnetism and radiation, discussing concepts like dielectric permittivity and synchrotron radiation, which are entirely unrelated to transformer-based models, ranked lists, truncation, and information retrieval. there is no mention of the key terms in the query, making it clear that the article is not relevant to the query.', 'eval': 0}


Evaluating articles:  82%|████████▏ | 82/100 [23:16<03:44, 12.49s/it]

Article: 'Novel Cascaded Gaussian Mixture Model-Deep Neural Network Classifier for
  Speaker Identification in Emotional Talking Environments'
 Classification: {'explanation': "i concur with the previous evaluation that the article is not relevant to the query about transformer-based models for optimizing ranked list truncation in information retrieval. the article discusses speaker identification using gaussian mixture model-deep neural network classifier, which is unrelated to the query topic. however, since the article is still related to deep learning and neural networks, i wouldn't say it has absolutely no relevance. hence, i would rate it a 1, indicating a slight relevance due to the shared topic of deep learning, but no direct connection to the query.", 'eval': 1}
Error when parsing feedback: Expecting value: line 1 column 1 (char 0)


Evaluating articles:  83%|████████▎ | 83/100 [23:38<04:18, 15.21s/it]

Article: 'A Note About the {Ki(z)} Functions'
 Classification: {'explanation': 'i agree with the previous evaluation. the article discusses mathematical properties of the ki(z) functions, which has no apparent connection to transformer-based models or information retrieval. the topics are unrelated, and there is no overlap between the two.', 'eval': 0}


Evaluating articles:  84%|████████▍ | 84/100 [23:48<03:42, 13.88s/it]

Article: 'Understanding Metrics for Paraphrasing'
 Classification: {'explanation': "i agree with the previous evaluation that the article is not directly related to the query about transformer-based models for optimizing ranked list truncation in information retrieval. however, i don't think it's completely irrelevant. the article discusses natural language generation and metrics for evaluating paraphrasing quality, which might have some indirect connections to information retrieval, although it's a stretch. hence, i would rate the relevance as 1, indicating that the article is only very slightly relevant to the query, sharing at most a similar topic.", 'eval': 1}


Evaluating articles:  85%|████████▌ | 85/100 [24:05<03:38, 14.59s/it]

Article: 'Single Crystal Growth of Cuprate Superconductor
  (Lu$_{0.8}$Nd$_{0.2}$)Ba$_2$Cu$_4$O$_8$ by KOH Flux Method'
 Classification: {'explanation': 'the article discusses the growth of single crystals of a cuprate superconductor using the koh flux method, and its structural and superconducting properties. the query, on the other hand, is about transformer-based models for optimizing ranked list truncation in information retrieval. there is no mention of transformers, models, optimization, ranked lists, or information retrieval in the article. the topics are entirely unrelated, and the article does not even share a similar topic with the query. however, i would not give it a 0, as the article does contain technical information and scientific jargon, which might be slightly relevant to the general field of scientific research, which is remotely related to information retrieval.', 'eval': 1}


Evaluating articles:  86%|████████▌ | 86/100 [24:23<03:40, 15.78s/it]

Article: 'Nonlinear Stochastic Trajectory Optimization for Centroidal Momentum
  Motion Generation of Legged Robots'
 Classification: {'explanation': 'i agree with the previous evaluation that the article has no relevance to the query. the article discusses trajectory optimization for legged robots, which is a topic in robotics and control systems, whereas the query is about transformer-based models for optimizing ranked list truncation in information retrieval, which is a topic in natural language processing and information retrieval. the two topics are unrelated, and the article does not mention anything related to the query.', 'eval': 0}


Evaluating articles:  87%|████████▋ | 87/100 [24:38<03:21, 15.49s/it]

Article: 'Leveraging Causal Inference for Explainable Automatic Program Repair'
 Classification: {'explanation': 'i agree with the previous evaluation that the article is not directly related to the query about transformer-based models for optimizing ranked list truncation in information retrieval. however, i think the relevance is not a complete 0 because both topics involve some common concepts like sequence-to-sequence models and the idea of optimizing/truncating output. although the domains and specific techniques are different, there might be some indirect connections or inspiration that could be drawn between the two areas. hence, i would rate the relevance as 1.', 'eval': 1}


Evaluating articles:  88%|████████▊ | 88/100 [24:56<03:15, 16.30s/it]

Article: 'Temporal Attention-Augmented Graph Convolutional Network for Efficient
  Skeleton-Based Human Action Recognition'
 Classification: {'explanation': "i agree with the previous evaluation that the article is not related to the query. the article discusses a graph convolutional network approach for skeleton-based human action recognition, which is a topic in computer vision and machine learning, whereas the query mentions transformer-based models for optimizing ranked list truncation in information retrieval, which is a topic in natural language processing and information retrieval. there is no apparent connection between the two topics. however, i wouldn't rate it as a 0, as the article still shares a general connection to machine learning and neural networks, which are related to the query's topic of transformer-based models. therefore, i would rate it as 1, indicating that the article is only very slightly relevant to the query, sharing a similar broad topic.", 'eval': 1}


Evaluating articles:  89%|████████▉ | 89/100 [25:19<03:21, 18.36s/it]

Article: 'Control Design of Autonomous Drone Using Deep Learning Based Image
  Understanding Techniques'
 Classification: {'explanation': 'i agree with the previous evaluation that the article is not relevant to the query. the article discusses autonomous drone control using deep learning-based image understanding techniques, which is unrelated to transformer-based models for optimizing ranked list truncation in information retrieval. the topics are distinct and do not share any commonalities.', 'eval': 0}


Evaluating articles:  90%|█████████ | 90/100 [25:26<02:28, 14.81s/it]

Article: 'Rigidity for rigid analytic motives'
 Classification: {'explanation': 'the article is about motives in algebraic geometry and number theory, while the query is about transformer-based models for optimizing ranked list truncation in information retrieval. the two topics are unrelated, and there is no mention of transformers, information retrieval, or ranked list truncation in the article. however, the article is about a specific mathematical concept, and the query is about a specific application of ai in information retrieval. while the topics are vastly different, they both belong to the realm of academia and research. therefore, i would rate the relevance as 1, indicating that the article is only very slightly relevant to the query, sharing at most a similar topic.', 'eval': 1}


Evaluating articles:  91%|█████████ | 91/100 [25:47<02:29, 16.66s/it]

Article: 'Sizing the White Whale'
 Classification: {'explanation': 'i agree with the previous evaluation that the article appears to be discussing mathematical concepts unrelated to the query. the topics of zonotopes, minkowski sums, and hyperplane arrangements do not seem to have any connection to transformer-based models, ranked list truncation, or information retrieval. the article does not mention any relevant keywords or concepts related to the query.', 'eval': 0}


Evaluating articles:  92%|█████████▏| 92/100 [26:06<02:18, 17.31s/it]

Article: 'Regularized maximal fidelity of the generalized Pauli channels'
 Classification: {'explanation': 'i agree with the previous evaluation. the article is about asymptotic regularization of the maximal fidelity for the generalized pauli channels, which is a topic in quantum information theory. the query is about transformer-based models for optimizing ranked list truncation in information retrieval, which is a topic in natural language processing and information retrieval. there is no apparent connection between the two topics, making the article completely irrelevant to the query.', 'eval': 0}


Evaluating articles:  93%|█████████▎| 93/100 [26:15<01:45, 15.04s/it]

Article: 'Fighting Contextual Bandits with Stochastic Smoothing'
 Classification: {'explanation': "i agree with the previous evaluation that the article is not directly related to the query about transformer-based models for optimizing ranked list truncation in information retrieval. the article discusses adversarial contextual bandit problems and stochastic smoothing, which is a different topic. there is no mention of transformers, ranked list truncation, or information retrieval in the article. however, i would rate the relevance as 1 instead of 0, as the article is still about a machine learning-related topic, even if it's not directly related to the query.", 'eval': 1}


Evaluating articles:  94%|█████████▍| 94/100 [26:32<01:33, 15.59s/it]

Article: 'Acute Lymphoblastic Leukemia Detection Using Hypercomplex-Valued
  Convolutional Neural Networks'
 Classification: {'explanation': 'i agree with the previous evaluation that the article is not directly related to the query, which is about transformer-based models for optimizing ranked list truncation in information retrieval. the article focuses on convolutional neural networks for image classification in medical diagnosis, which is a different topic in a different domain. however, i would rate the relevance as 1 instead of 0, as both topics share a common thread of machine learning and deep learning techniques, even though the application domains are different.', 'eval': 1}


Evaluating articles:  95%|█████████▌| 95/100 [26:46<01:15, 15.02s/it]

Article: 'The profinite completion of relatively hyperbolic virtually special
  groups'
 Classification: {'explanation': 'i fully agree with the previous evaluation. the article is a mathematical paper that deals with group theory and topology, which is completely unrelated to the query that involves transformer-based models and information retrieval. the terminology and content of the article are entirely different from the query, making it irrelevant.', 'eval': 0}


Evaluating articles:  96%|█████████▌| 96/100 [27:03<01:02, 15.53s/it]

Article: 'On-Shell Electric-Magnetic Duality and the Dual Graviton'
 Classification: {'explanation': 'i agree with the previous evaluation that the article is completely unrelated to the query about transformer-based models for optimizing ranked list truncation in information retrieval. the article discusses advanced concepts in physics, such as electric-magnetic duality, gravitons, and scattering amplitudes, which have no apparent connection to the query. the language, terminology, and concepts used in the article are distinct from those in the query, indicating a lack of relevance.', 'eval': 0}


Evaluating articles:  97%|█████████▋| 97/100 [27:15<00:44, 14.69s/it]

Article: 'A stationary heat conduction problem'
 Classification: {'explanation': "i agree with the previous evaluation that the article is not directly related to transformer-based models or ranked list truncation in information retrieval. the article is focused on a mathematical physics topic, specifically a stationary heat conduction problem, which is a vastly different domain from the query. however, i wouldn't rate it as a complete 0, as the article does involve mathematical concepts and problem-solving, which are indirectly related to the general field of algorithms and models used in information retrieval. hence, i rate it as a 1, indicating a very slight relevance.", 'eval': 1}


Evaluating articles:  98%|█████████▊| 98/100 [27:23<00:24, 12.49s/it]

Article: 'Small-mass naked singularities censored by the Higgs field'
 Classification: {'explanation': 'the article is about vacuum decay and singularities in physics, while the query is about optimizing ranked list truncation in information retrieval using transformer-based models. there is no connection between the two topics. the article does not mention transformers, models, ranking, or truncation, and the query does not mention physics, singularities, or vacuum decay.', 'eval': 0}


Evaluating articles:  99%|█████████▉| 99/100 [27:44<00:15, 15.20s/it]

Article: 'Thermal Instability of Halo Gas Heated by Streaming Cosmic Rays'
 Classification: {'explanation': 'i agree with the previous evaluation that the article is unrelated to the query. the article discusses thermal instability of halo gas heated by cosmic rays, which is a topic in astrophysics, whereas the query is about transformer-based models for optimizing ranked list truncation in information retrieval, which is a topic in natural language processing and computer science. there is no connection between the two topics.', 'eval': 0}


Evaluating articles: 100%|██████████| 100/100 [28:01<00:00, 16.82s/it]

Article: 'Choppy: Cut Transformer For Ranked List Truncation'
 Classification: {'explanation': "the article is highly relevant to the query as it proposes a transformer-based model, choppy, specifically designed to optimize ranked list truncation in information retrieval, which aligns perfectly with the query. the model's architecture, based on the transformer architecture, and its ability to optimize user-defined ir metrics, make it a strong match for the query.", 'eval': 3}





In [115]:
evaluated_levels_df = pd.DataFrame(evaluated)

In [116]:
evaluated_levels_df[evaluated_levels_df['eval'] >= 2]

Unnamed: 0,title,abstract,eval
35,DeeBERT: Dynamic Early Exiting for Acceleratin...,Large-scale pre-trained language models such...,2
99,Choppy: Cut Transformer For Ranked List Trunca...,Work in information retrieval has traditiona...,3


In [117]:
evaluated_levels_df[evaluated_levels_df['eval'] >= 1]

Unnamed: 0,title,abstract,eval
1,Deep Convolutional Neural Networks Model-based...,Diagnosing Brain Tumor with the aid of Magne...,1
2,A Theory-Based Evaluation of Nearest Neighbor ...,In the $k$-nearest neighborhood model ($k$-N...,1
5,Integration of Blockchain and Edge Computing i...,As an important technology to ensure data se...,1
6,Multi-fidelity power flow solver,We propose a multi-fidelity neural network (...,1
7,Automatic Detection of ECG Abnormalities by us...,Heart disease is one of the most common dise...,1
15,Don't shoot butterfly with rifles: Multi-chann...,With its strong modeling capacity that comes...,1
18,Fourier transform detection of weak optical tr...,We demonstrate a means of detecting weak opt...,1
19,sBSNN: Stochastic-Bits Enabled Binary Spiking ...,"In this work, we propose stochastic Binary S...",1
20,Which Generation Shows the Most Prudent Data S...,We report from a study performed in ten Euro...,1
22,X-ray measurement model incorporating energy-c...,"Extending our prior work, we propose a multi...",1


In [118]:
evaluated_levels_df['eval'].value_counts()

0    56
1    42
2     1
3     1
Name: eval, dtype: int64