In [1]:
from trectools import TrecPool, TrecRun, TrecPoolMaker

# Load the two runs that will contribute documents to the pools.
r1 = TrecRun("./robust03/runs/input.aplrob03a.gz")
r2 = TrecRun("./robust03/runs/input.UIUC03Rd1.gz")

len(r1.topics())  # 100 topics

# Build document pools from r1 and r2 using two different strategies.

# Strategy 1: pool the top 10 documents of each run.
pool1 = TrecPoolMaker().make_pool(
    [r1, r2],
    strategy="topX",
    topX=10,
)  # Pool with 1636 unique documents.

# Strategy 2: pool 2000 documents (20 per topic) using the reciprocal rank
# fusion (RRF) strategy by Cormack, Clarke and Buettcher.
pool2 = TrecPoolMaker().make_pool(
    [r1, r2],
    strategy="rrf",
    topX=20,
    rrf_den=60,
)  # Pool with 2000 unique documents.


In [2]:
# Internally, a pool is a dictionary mapping each topic id to the set of
# document names pooled for that topic.
pool1.pool

{601: {'FBIS3-12202',
  'FBIS3-22369',
  'FBIS3-38723',
  'FBIS3-42193',
  'FBIS4-1981',
  'FBIS4-44484',
  'FBIS4-64831',
  'FR940404-2-00028',
  'FT922-13069',
  'FT923-11593',
  'FT923-9764',
  'FT931-10200',
  'FT931-13722',
  'FT931-14451',
  'FT942-15268',
  'FT944-10568'},
 602: {'FT921-1623',
  'FT922-1409',
  'FT922-1498',
  'FT922-1536',
  'FT922-1680',
  'FT922-2143',
  'FT922-2288',
  'FT922-2508',
  'FT923-2408',
  'FT923-5753',
  'FT923-8609',
  'FT924-171',
  'FT934-11227',
  'FT934-11235'},
 603: {'FT922-991',
  'FT924-9307',
  'FT941-1212',
  'FT941-1443',
  'FT942-1181',
  'FT942-14179',
  'FT942-15472',
  'FT942-6205',
  'FT943-8137',
  'FT944-3264',
  'FT944-3389',
  'LA052689-0103',
  'LA072790-0059',
  'LA081990-0051',
  'LA122590-0054'},
 604: {'FBIS4-45839',
  'FBIS4-67664',
  'FR940802-1-00015',
  'FT943-12041',
  'LA061389-0087',
  'LA071989-0117',
  'LA073090-0058',
  'LA081989-0064',
  'LA092090-0248',
  'LA092690-0153',
  'LA111590-0227',
  'LA112690-0027',

In [3]:
# Check which pool covers my run r1 better, starting with pool1 (the topX pool).
pool1.check_coverage(r1, topX=10) 

10.0

In [4]:
# Same coverage check against pool2 (the RRF pool), for comparison with pool1.
pool2.check_coverage(r1, topX=10) # Result: 8.35

8.35

In [5]:
# Export the pooled documents to a file in the format used by the Relevation!
# visual assessment system, so that they can be judged there.
pool1.export_document_list(filename="mypool.txt", with_format="relevation")

Created mypool.txt
