Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
The table of contents is too big for display.
Diff view
Diff view
  •  
  •  
  •  
109 changes: 109 additions & 0 deletions .evolve/compare-drivers-canonical/1780163083769/lift-drivers.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,109 @@
{
"task": "structured-field-extraction (deterministic exact-match judge)",
"backend": {
"model": "deepseek-chat",
"baseUrl": "https://api.deepseek.com/v1",
"verdict": "real"
},
"pricing": {
"inPerMTokens": 0.27,
"outPerMTokens": 1.1
},
"integrity": {
"verdict": "real",
"realRecords": 176,
"stubRecords": 0,
"totalInputTokens": 16779,
"totalOutputTokens": 7175,
"diagnosis": "176 records with real LLM activity (in=16779, out=7175 tokens, $0.0124)."
},
"dataset": {
"search": 8,
"holdout": 6
},
"baselineSurface": "Extract the transaction info from the message as JSON.",
"holdoutScenarioIds": [
"h1",
"h2",
"h3",
"h4",
"h5",
"h6"
],
"scores": [
{
"name": "gepa-reflection",
"rank": 1,
"baselineComposite": 0.583,
"winnerComposite": 1,
"lift": 0.417,
"liftCi": {
"low": 0.208,
"high": 0.583
},
"costUsd": 0.00284,
"winnerSurface": "Extract the transaction info as JSON with keys: merchant, amount (bare decimal number, no currency symbol), date (ISO YYYY-MM-DD), category (one of: groceries, dining, transport, utilities, entertainment)."
},
{
"name": "skill-opt",
"rank": 2,
"baselineComposite": 0.583,
"winnerComposite": 1,
"lift": 0.417,
"liftCi": {
"low": 0.208,
"high": 0.583
},
"costUsd": 0.003507,
"winnerSurface": "Extract the transaction info from the message as JSON.\nExample: {\"merchant\": \"Starbucks\", \"amount\": 5.75, \"date\": \"2023-10-05\", \"category\": \"dining\"}\n Use keys: merchant, amount, date, category. Amount must be a bare number. Date must be ISO YYYY-MM-DD. Category must be one of: groceries, dining, transport, utilities, entertainment."
},
{
"name": "gepa-pareto",
"rank": 3,
"baselineComposite": 0.583,
"winnerComposite": 0.958,
"lift": 0.375,
"liftCi": {
"low": 0.208,
"high": 0.583
},
"costUsd": 0.002791,
"winnerSurface": "Extract the transaction info as JSON with keys: merchant (string), amount (bare decimal number, no currency), date (ISO YYYY-MM-DD), category (one of: groceries, dining, transport, utilities, entertainment)."
}
],
"best": {
"name": "gepa-reflection",
"lift": 0.417,
"liftCi": {
"low": 0.208,
"high": 0.583
}
},
"pairwise": [
{
"a": "gepa-reflection",
"b": "skill-opt",
"deltaMean": 0,
"ci": {
"low": 0,
"high": 0
},
"favored": "tie"
},
{
"a": "gepa-reflection",
"b": "gepa-pareto",
"deltaMean": 0.042,
"ci": {
"low": 0,
"high": 0.125
},
"favored": "tie"
}
],
"totalCostUsd": 0.012423,
"llmCalls": 176,
"elapsedSec": 131,
"honestVerdict": "lift-proven",
"publishedAt": "2026-05-30T17:44:43.769Z"
}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"cellId":"s1:0","scenarioId":"s1","rep":0,"artifact":{"text":"{\n \"date\": \"2024-03-03\",\n \"amount\": 42.50,\n \"merchant\": \"Whole Foods Market\",\n \"description\": \"weekly groceries\"\n}","parsed":{"date":"2024-03-03","amount":42.5,"merchant":"Whole Foods Market","description":"weekly groceries"}},"judgeScores":{"field-exact-match":{"dimensions":{"merchant":1,"amount":1,"date":1,"category":0},"composite":0.75,"notes":"parsed"}},"costUsd":0.00006049000000000001,"tokenUsage":{"input":57,"output":41},"durationMs":1312,"seed":42,"cached":false}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"name":"cost.worker","cellId":"s1:0","startMs":1780163130748,"amountUsd":0.00006049000000000001,"durationMs":0}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"cellId":"s2:0","scenarioId":"s2","rep":0,"artifact":{"text":"{\n \"merchant\": \"Uber\",\n \"amount\": 18.20,\n \"description\": \"ride downtown\",\n \"date\": \"2024-01-07\"\n}","parsed":{"merchant":"Uber","amount":18.2,"description":"ride downtown","date":"2024-01-07"}},"judgeScores":{"field-exact-match":{"dimensions":{"merchant":1,"amount":1,"date":1,"category":0},"composite":0.75,"notes":"parsed"}},"costUsd":0.00005885000000000001,"tokenUsage":{"input":55,"output":40},"durationMs":1343,"seed":43,"cached":false}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"name":"cost.worker","cellId":"s2:0","startMs":1780163130779,"amountUsd":0.00005885000000000001,"durationMs":0}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"cellId":"s3:0","scenarioId":"s3","rep":0,"artifact":{"text":"{\n \"description\": \"Dinner at Olive Garden\",\n \"amount\": 67,\n \"currency\": \"USD\",\n \"date\": \"2024-02-14\"\n}","parsed":{"description":"Dinner at Olive Garden","amount":67,"currency":"USD","date":"2024-02-14"}},"judgeScores":{"field-exact-match":{"dimensions":{"merchant":0,"amount":1,"date":1,"category":0},"composite":0.5,"notes":"parsed"}},"costUsd":0.00005721000000000001,"tokenUsage":{"input":53,"output":39},"durationMs":967,"seed":44,"cached":false}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"name":"cost.worker","cellId":"s3:0","startMs":1780163131715,"amountUsd":0.00005721000000000001,"durationMs":0}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"cellId":"s4:0","scenarioId":"s4","rep":0,"artifact":{"text":"{\n \"merchant\": \"ConEdison\",\n \"amount\": 130.99,\n \"category\": \"Utilities\",\n \"date\": \"2023-12-01\"\n}","parsed":{"merchant":"ConEdison","amount":130.99,"category":"Utilities","date":"2023-12-01"}},"judgeScores":{"field-exact-match":{"dimensions":{"merchant":1,"amount":1,"date":1,"category":1},"composite":1,"notes":"parsed"}},"costUsd":0.00005966000000000001,"tokenUsage":{"input":58,"output":40},"durationMs":1067,"seed":45,"cached":false}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"name":"cost.worker","cellId":"s4:0","startMs":1780163131847,"amountUsd":0.00005966000000000001,"durationMs":0}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"cellId":"s5:0","scenarioId":"s5","rep":0,"artifact":{"text":"{\n \"merchant\": \"AMC Theatres\",\n \"amount\": 24,\n \"date\": \"2024-04-05\",\n \"description\": \"Bought movie tickets\"\n}","parsed":{"merchant":"AMC Theatres","amount":24,"date":"2024-04-05","description":"Bought movie tickets"}},"judgeScores":{"field-exact-match":{"dimensions":{"merchant":1,"amount":1,"date":1,"category":0},"composite":0.75,"notes":"parsed"}},"costUsd":0.00006323,"tokenUsage":{"input":59,"output":43},"durationMs":1154,"seed":46,"cached":false}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"name":"cost.worker","cellId":"s5:0","startMs":1780163132868,"amountUsd":0.00006323,"durationMs":0}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"cellId":"s6:0","scenarioId":"s6","rep":0,"artifact":{"text":"{\n \"merchant\": \"Trader Joe's\",\n \"amount\": 55.10,\n \"date\": \"2024-02-28\",\n \"category\": \"produce\"\n}","parsed":{"merchant":"Trader Joe's","amount":55.1,"date":"2024-02-28","category":"produce"}},"judgeScores":{"field-exact-match":{"dimensions":{"merchant":1,"amount":1,"date":1,"category":0},"composite":0.75,"notes":"parsed"}},"costUsd":0.00006159,"tokenUsage":{"input":57,"output":42},"durationMs":1152,"seed":47,"cached":false}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"name":"cost.worker","cellId":"s6:0","startMs":1780163132999,"amountUsd":0.00006159,"durationMs":0}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"cellId":"s7:0","scenarioId":"s7","rep":0,"artifact":{"text":"{\n \"amount\": 9.75,\n \"date\": \"2024-03-19\",\n \"description\": \"airport drop-off\",\n \"merchant\": \"Lyft\"\n}","parsed":{"amount":9.75,"date":"2024-03-19","description":"airport drop-off","merchant":"Lyft"}},"judgeScores":{"field-exact-match":{"dimensions":{"merchant":1,"amount":1,"date":1,"category":0},"composite":0.75,"notes":"parsed"}},"costUsd":0.00006159,"tokenUsage":{"input":57,"output":42},"durationMs":1198,"seed":48,"cached":false}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"name":"cost.worker","cellId":"s7:0","startMs":1780163134067,"amountUsd":0.00006159,"durationMs":0}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"cellId":"s8:0","scenarioId":"s8","rep":0,"artifact":{"text":"{\n \"amount\": 15.49,\n \"currency\": \"USD\",\n \"date\": \"2024-01-22\",\n \"description\": \"Netflix monthly subscription\",\n \"type\": \"debit\"\n}","parsed":{"amount":15.49,"currency":"USD","date":"2024-01-22","description":"Netflix monthly subscription","type":"debit"}},"judgeScores":{"field-exact-match":{"dimensions":{"merchant":0,"amount":1,"date":1,"category":0},"composite":0.5,"notes":"parsed"}},"costUsd":0.00006765,"tokenUsage":{"input":55,"output":48},"durationMs":1337,"seed":49,"cached":false}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"name":"cost.worker","cellId":"s8:0","startMs":1780163134336,"amountUsd":0.00006765,"durationMs":0}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"cellId":"s1:0","scenarioId":"s1","rep":0,"artifact":{"text":"{\n \"merchant\": \"Whole Foods Market\",\n \"amount\": 42.50,\n \"date\": \"2024-03-03\",\n \"category\": \"groceries\"\n}","parsed":{"merchant":"Whole Foods Market","amount":42.5,"date":"2024-03-03","category":"groceries"}},"judgeScores":{"field-exact-match":{"dimensions":{"merchant":1,"amount":1,"date":1,"category":1},"composite":1,"notes":"parsed"}},"costUsd":0.00007158,"tokenUsage":{"input":94,"output":42},"durationMs":1415,"seed":42,"cached":false}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"name":"cost.worker","cellId":"s1:0","startMs":1780163138562,"amountUsd":0.00007158,"durationMs":0}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"cellId":"s2:0","scenarioId":"s2","rep":0,"artifact":{"text":"{\n \"merchant\": \"Uber\",\n \"amount\": 18.20,\n \"date\": \"2024-01-07\",\n \"category\": \"transport\"\n}","parsed":{"merchant":"Uber","amount":18.2,"date":"2024-01-07","category":"transport"}},"judgeScores":{"field-exact-match":{"dimensions":{"merchant":1,"amount":1,"date":1,"category":1},"composite":1,"notes":"parsed"}},"costUsd":0.00006774000000000001,"tokenUsage":{"input":92,"output":39},"durationMs":1306,"seed":43,"cached":false}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"name":"cost.worker","cellId":"s2:0","startMs":1780163138454,"amountUsd":0.00006774000000000001,"durationMs":0}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"cellId":"s3:0","scenarioId":"s3","rep":0,"artifact":{"text":"{\n \"merchant\": \"Olive Garden\",\n \"amount\": 67,\n \"date\": \"2024-02-14\",\n \"category\": \"dining\"\n}","parsed":{"merchant":"Olive Garden","amount":67,"date":"2024-02-14","category":"dining"}},"judgeScores":{"field-exact-match":{"dimensions":{"merchant":1,"amount":1,"date":1,"category":1},"composite":1,"notes":"parsed"}},"costUsd":0.00006720000000000001,"tokenUsage":{"input":90,"output":39},"durationMs":1042,"seed":44,"cached":false}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"name":"cost.worker","cellId":"s3:0","startMs":1780163139496,"amountUsd":0.00006720000000000001,"durationMs":0}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"cellId":"s4:0","scenarioId":"s4","rep":0,"artifact":{"text":"{\n \"merchant\": \"ConEdison\",\n \"amount\": 130.99,\n \"date\": \"2023-12-01\",\n \"category\": \"utilities\"\n}","parsed":{"merchant":"ConEdison","amount":130.99,"date":"2023-12-01","category":"utilities"}},"judgeScores":{"field-exact-match":{"dimensions":{"merchant":1,"amount":1,"date":1,"category":1},"composite":1,"notes":"parsed"}},"costUsd":0.00007075000000000001,"tokenUsage":{"input":95,"output":41},"durationMs":1128,"seed":45,"cached":false}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"name":"cost.worker","cellId":"s4:0","startMs":1780163139689,"amountUsd":0.00007075000000000001,"durationMs":0}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"cellId":"s5:0","scenarioId":"s5","rep":0,"artifact":{"text":"{\n \"merchant\": \"AMC Theatres\",\n \"amount\": 24,\n \"date\": \"2024-04-05\",\n \"category\": \"entertainment\"\n}","parsed":{"merchant":"AMC Theatres","amount":24,"date":"2024-04-05","category":"entertainment"}},"judgeScores":{"field-exact-match":{"dimensions":{"merchant":1,"amount":1,"date":1,"category":1},"composite":1,"notes":"parsed"}},"costUsd":0.00007212000000000001,"tokenUsage":{"input":96,"output":42},"durationMs":1345,"seed":46,"cached":false}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"name":"cost.worker","cellId":"s5:0","startMs":1780163140840,"amountUsd":0.00007212000000000001,"durationMs":0}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"cellId":"s6:0","scenarioId":"s6","rep":0,"artifact":{"text":"{\n \"merchant\": \"Trader Joe's\",\n \"amount\": 55.10,\n \"date\": \"2024-02-28\",\n \"category\": \"groceries\"\n}","parsed":{"merchant":"Trader Joe's","amount":55.1,"date":"2024-02-28","category":"groceries"}},"judgeScores":{"field-exact-match":{"dimensions":{"merchant":1,"amount":1,"date":1,"category":1},"composite":1,"notes":"parsed"}},"costUsd":0.00007268,"tokenUsage":{"input":94,"output":43},"durationMs":1299,"seed":47,"cached":false}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"name":"cost.worker","cellId":"s6:0","startMs":1780163140989,"amountUsd":0.00007268,"durationMs":0}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"cellId":"s7:0","scenarioId":"s7","rep":0,"artifact":{"text":"{\n \"merchant\": \"Lyft\",\n \"amount\": 9.75,\n \"date\": \"2024-03-19\",\n \"category\": \"transport\"\n}","parsed":{"merchant":"Lyft","amount":9.75,"date":"2024-03-19","category":"transport"}},"judgeScores":{"field-exact-match":{"dimensions":{"merchant":1,"amount":1,"date":1,"category":1},"composite":1,"notes":"parsed"}},"costUsd":0.00006828,"tokenUsage":{"input":94,"output":39},"durationMs":1294,"seed":48,"cached":false}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"name":"cost.worker","cellId":"s7:0","startMs":1780163142134,"amountUsd":0.00006828,"durationMs":0}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"cellId":"s8:0","scenarioId":"s8","rep":0,"artifact":{"text":"{\n \"merchant\": \"Netflix\",\n \"amount\": 15.49,\n \"date\": \"2024-01-22\",\n \"category\": \"entertainment\"\n}","parsed":{"merchant":"Netflix","amount":15.49,"date":"2024-01-22","category":"entertainment"}},"judgeScores":{"field-exact-match":{"dimensions":{"merchant":1,"amount":1,"date":1,"category":1},"composite":1,"notes":"parsed"}},"costUsd":0.00006994000000000001,"tokenUsage":{"input":92,"output":41},"durationMs":1253,"seed":49,"cached":false}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"name":"cost.worker","cellId":"s8:0","startMs":1780163142242,"amountUsd":0.00006994000000000001,"durationMs":0}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"cellId":"s1:0","scenarioId":"s1","rep":0,"artifact":{"text":"{\n \"merchant\": \"Whole Foods Market\",\n \"amount\": 42.50,\n \"date\": \"2024-03-03\",\n \"category\": \"groceries\"\n}","parsed":{"merchant":"Whole Foods Market","amount":42.5,"date":"2024-03-03","category":"groceries"}},"judgeScores":{"field-exact-match":{"dimensions":{"merchant":1,"amount":1,"date":1,"category":1},"composite":1,"notes":"parsed"}},"costUsd":0.00006861,"tokenUsage":{"input":83,"output":42},"durationMs":1004,"seed":42,"cached":false}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"name":"cost.worker","cellId":"s1:0","startMs":1780163143246,"amountUsd":0.00006861,"durationMs":0}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"cellId":"s2:0","scenarioId":"s2","rep":0,"artifact":{"text":"{\n \"merchant\": \"Uber\",\n \"amount\": 18.20,\n \"date\": \"2024-01-07\",\n \"category\": \"transport\"\n}","parsed":{"merchant":"Uber","amount":18.2,"date":"2024-01-07","category":"transport"}},"judgeScores":{"field-exact-match":{"dimensions":{"merchant":1,"amount":1,"date":1,"category":1},"composite":1,"notes":"parsed"}},"costUsd":0.00006477,"tokenUsage":{"input":81,"output":39},"durationMs":1357,"seed":43,"cached":false}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"name":"cost.worker","cellId":"s2:0","startMs":1780163143599,"amountUsd":0.00006477,"durationMs":0}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"cellId":"s3:0","scenarioId":"s3","rep":0,"artifact":{"text":"{\n \"merchant\": \"Olive Garden\",\n \"amount\": 67,\n \"date\": \"2024-02-14\",\n \"category\": \"dining\"\n}","parsed":{"merchant":"Olive Garden","amount":67,"date":"2024-02-14","category":"dining"}},"judgeScores":{"field-exact-match":{"dimensions":{"merchant":1,"amount":1,"date":1,"category":1},"composite":1,"notes":"parsed"}},"costUsd":0.00006423,"tokenUsage":{"input":79,"output":39},"durationMs":1337,"seed":44,"cached":false}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"name":"cost.worker","cellId":"s3:0","startMs":1780163144583,"amountUsd":0.00006423,"durationMs":0}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"cellId":"s4:0","scenarioId":"s4","rep":0,"artifact":{"text":"{\n \"merchant\": \"ConEdison\",\n \"amount\": 130.99,\n \"date\": \"2023-12-01\",\n \"category\": \"utilities\"\n}","parsed":{"merchant":"ConEdison","amount":130.99,"date":"2023-12-01","category":"utilities"}},"judgeScores":{"field-exact-match":{"dimensions":{"merchant":1,"amount":1,"date":1,"category":1},"composite":1,"notes":"parsed"}},"costUsd":0.00006778,"tokenUsage":{"input":84,"output":41},"durationMs":1393,"seed":45,"cached":false}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"name":"cost.worker","cellId":"s4:0","startMs":1780163144993,"amountUsd":0.00006778,"durationMs":0}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"cellId":"s5:0","scenarioId":"s5","rep":0,"artifact":{"text":"{\n \"merchant\": \"AMC Theatres\",\n \"amount\": 24,\n \"date\": \"2024-04-05\",\n \"category\": \"entertainment\"\n}","parsed":{"merchant":"AMC Theatres","amount":24,"date":"2024-04-05","category":"entertainment"}},"judgeScores":{"field-exact-match":{"dimensions":{"merchant":1,"amount":1,"date":1,"category":1},"composite":1,"notes":"parsed"}},"costUsd":0.00006915,"tokenUsage":{"input":85,"output":42},"durationMs":1111,"seed":46,"cached":false}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"name":"cost.worker","cellId":"s5:0","startMs":1780163145695,"amountUsd":0.00006915,"durationMs":0}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"cellId":"s6:0","scenarioId":"s6","rep":0,"artifact":{"text":"{\n \"merchant\": \"Trader Joe's\",\n \"amount\": 55.10,\n \"date\": \"2024-02-28\",\n \"category\": \"groceries\"\n}","parsed":{"merchant":"Trader Joe's","amount":55.1,"date":"2024-02-28","category":"groceries"}},"judgeScores":{"field-exact-match":{"dimensions":{"merchant":1,"amount":1,"date":1,"category":1},"composite":1,"notes":"parsed"}},"costUsd":0.00006971000000000001,"tokenUsage":{"input":83,"output":43},"durationMs":1051,"seed":47,"cached":false}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"name":"cost.worker","cellId":"s6:0","startMs":1780163146044,"amountUsd":0.00006971000000000001,"durationMs":0}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"cellId":"s7:0","scenarioId":"s7","rep":0,"artifact":{"text":"{\n \"merchant\": \"Lyft\",\n \"amount\": 9.75,\n \"date\": \"2024-03-19\",\n \"category\": \"transport\"\n}","parsed":{"merchant":"Lyft","amount":9.75,"date":"2024-03-19","category":"transport"}},"judgeScores":{"field-exact-match":{"dimensions":{"merchant":1,"amount":1,"date":1,"category":1},"composite":1,"notes":"parsed"}},"costUsd":0.00006531000000000001,"tokenUsage":{"input":83,"output":39},"durationMs":1347,"seed":48,"cached":false}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"name":"cost.worker","cellId":"s7:0","startMs":1780163147042,"amountUsd":0.00006531000000000001,"durationMs":0}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"cellId":"s8:0","scenarioId":"s8","rep":0,"artifact":{"text":"{\n \"merchant\": \"Netflix\",\n \"amount\": 15.49,\n \"date\": \"2024-01-22\",\n \"category\": \"entertainment\"\n}","parsed":{"merchant":"Netflix","amount":15.49,"date":"2024-01-22","category":"entertainment"}},"judgeScores":{"field-exact-match":{"dimensions":{"merchant":1,"amount":1,"date":1,"category":1},"composite":1,"notes":"parsed"}},"costUsd":0.00006697,"tokenUsage":{"input":81,"output":41},"durationMs":1013,"seed":49,"cached":false}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{"name":"cost.worker","cellId":"s8:0","startMs":1780163147057,"amountUsd":0.00006697,"durationMs":0}
Loading
Loading