From 2d32d142a0baecce380b4bcdfb456b8cfc11e989 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Tom=20D=C3=B6rr?= <tomdoerr96@gmail.com>
Date: Tue, 16 Apr 2024 01:16:08 +0200
Subject: [PATCH] Add missing gold_passages_retrieved function

---
 docs/docs/tutorials/simplified-baleen.md | 8 ++++++++
 1 file changed, 8 insertions(+)

diff --git a/docs/docs/tutorials/simplified-baleen.md b/docs/docs/tutorials/simplified-baleen.md
index 6a7e94ca2b..71ff35bbfe 100644
--- a/docs/docs/tutorials/simplified-baleen.md
+++ b/docs/docs/tutorials/simplified-baleen.md
@@ -193,6 +193,14 @@ Let's now define our evaluation function and compare the performance of the unco
 ```python
 from dspy.evaluate.evaluate import Evaluate
 
+# Define metric to check if we retrieved the correct documents
+def gold_passages_retrieved(example, pred, trace=None):
+    gold_titles = set(map(dspy.evaluate.normalize_text, example["gold_titles"]))
+    found_titles = set(
+        map(dspy.evaluate.normalize_text, [c.split(" | ")[0] for c in pred.context])
+    )
+    return gold_titles.issubset(found_titles)
+
 # Set up the `evaluate_on_hotpotqa` function. We'll use this many times below.
 evaluate_on_hotpotqa = Evaluate(devset=devset, num_threads=1, display_progress=True, display_table=5)