### Pipeline test ###

In this notebook we try out a possible textual claim generation pipeline, to be implemented later as part of the package.

In [3]:
from hydra.core.global_hydra import GlobalHydra
from hydra import initialize,compose
from src.evidence import FeverousRetrieverRandom
from src.pipeline import ClaimGeneratorPipeline
from src.claim import FeverousGenerator
from src.claim import ToTToGenerator
from src.claim import TextualClaim
import numpy as np
import tensorflow_text
import json
import tensorflow as tf

# Notebook setup: adjust TensorFlow logging and (re)initialise Hydra.

# Set the TensorFlow logger to the 'ERROR' level.
tf.get_logger().setLevel('ERROR')
# Clear the global Hydra instance before initialising again
# (presumably so that this cell can be re-run in the same kernel — confirm).
GlobalHydra.instance().clear()
# Initialise Hydra with the project's config directory. This is the last expression
# of the cell, so the notebook displays its repr as the cell output.
initialize(config_path='../src/config/', job_name="test_app")

hydra.initialize()

In [4]:
# Compose the pipeline configuration named "config_pipeline".
cfg = compose(config_name="config_pipeline")

# NumPy random generator seeded from the composed configuration.
rng = np.random.default_rng(cfg.seed)

# Keyword arguments shared by every retriever built below.
# NOTE(review): the retriever seed is the literal 44 while `rng` is seeded from
# cfg.seed — confirm that this difference is intentional.
retriever_options = dict(
    p_dataset=cfg.notebook.data_path,
    num_positive=10,
    num_negative=0,
    wrong_cell=2,
    table_per_page=cfg.table_per_page,
    evidence_per_table=cfg.evidence_per_table,
    column_per_table=cfg.column_per_table,
    seed=44,
    verbose=True,
)

# One retriever per key strategy; only 'entity' is listed at the moment.
retrievers = [
    FeverousRetrieverRandom(key_strategy=key_strategy, **retriever_options)
    for key_strategy in ['entity']
]


# Locations of the model artefacts passed to the generators.
feverous_model_path = '../models/t5_train_feverous.bin'
totto_model_path = '../models/exported_totto_large/1648208035'

# FEVEROUS generator; instantiated here but not included in `generators` below.
generator1 = FeverousGenerator(
    encoding='compact',
    model_path=feverous_model_path,
)

# A second ToTTo generator (generator2, encoding='totto', same exported model)
# was tried here and is currently disabled.

# ToTTo generator using the 'compact' encoding, with verbose output enabled.
generator3 = ToTToGenerator(
    encoding='compact',
    model_path=totto_model_path,
    verbose=True,
)

# Only the ToTTo generator takes part in this run.
generators = [generator3]

# Build the pipeline from the retriever and generator lists, then generate claims.
pipeline = ClaimGeneratorPipeline([retrievers, generators])
# Right now, FeverousRetriever doesn't support an input table
claims = pipeline.generate()


# Convert the generated claims with TextualClaim.to_json and write the result
# to data.json as indented, non-ASCII-escaped JSON.
json_evidence = TextualClaim.to_json(claims)
with open('data.json', 'w', encoding='utf-8') as out_file:
    json.dump(
        json_evidence,
        out_file,
        ensure_ascii=False,
        indent=4,
    )



INFO logger 2022-06-02 22:05:09,490 | feverous_retriever.py:115 | b' wikipage: Carrot soup'
INFO logger 2022-06-02 22:05:09,519 | feverous_retriever.py:115 | b' wikipage: Rhytiphora obscura'
INFO logger 2022-06-02 22:05:09,523 | feverous_retriever.py:115 | b' wikipage: Tired Eyes Slowly Burning'
INFO logger 2022-06-02 22:05:09,524 | feverous_retriever.py:115 | b' wikipage: Vadia (Narmada)'
INFO logger 2022-06-02 22:05:09,527 | feverous_retriever.py:115 | b' wikipage: Saint-Hubert Air Base'
INFO logger 2022-06-02 22:05:09,529 | feverous_retriever.py:115 | b' wikipage: Megachile rambutwan'
INFO logger 2022-06-02 22:05:09,531 | feverous_retriever.py:115 | b' wikipage: Manfred Hellmann'
INFO logger 2022-06-02 22:05:09,534 | feverous_retriever.py:115 | b' wikipage: Richard Do\xcc\x88cker'
INFO logger 2022-06-02 22:05:09,535 | feverous_retriever.py:115 | b' wikipage: 1949 Western Michigan Broncos football team'
INFO logger 2022-06-02 22:05:10,387 | feverous_retriever_random.py:124 | b"Page: 

KeyboardInterrupt: 