Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
23 commits
Select commit Hold shift + click to select a range
ed832ca
feat(pkg): start of MCP sim package
TomMonks Aug 1, 2025
a3abce3
feat(pkg): +Protocol to adapt sim model interface
TomMonks Aug 1, 2025
b6db7c5
feat(examples): call_centre_model
TomMonks Aug 1, 2025
0932d42
feat(server): added generic sim mcp server code
TomMonks Aug 1, 2025
8039f93
clean(self_ref): removed commented out models
TomMonks Aug 1, 2025
8b69a76
feat(call_centre): renamed adapter class
TomMonks Aug 1, 2025
783e516
feat(mcp): setup script to run new framework
TomMonks Aug 1, 2025
87a17d0
fix(planner): memory stores schema under get_schema
TomMonks Aug 7, 2025
1f119cc
feat(planner): shorten plan preview to 500 characters
TomMonks Aug 7, 2025
66bfbd4
chore(clean): removed original mcp and model modules
TomMonks Aug 7, 2025
68491f8
chore(clean): removed redundant top level resource dir
TomMonks Aug 7, 2025
eeb0dc4
docs(readme): updated run mcp instructions
TomMonks Aug 7, 2025
ef412b0
docs(env): +arize-phoenix
TomMonks Aug 11, 2025
6c43aae
feat(evals): added basic langgraph tracing arize-phoenix
TomMonks Aug 11, 2025
0176218
feat(evals): draft tracing
TomMonks Aug 12, 2025
1073cbe
feat(evals): added initial eval data
TomMonks Aug 12, 2025
aa70d86
feat(evals): added basic eval script
TomMonks Aug 12, 2025
1e15020
feat(evals): trial run with gemma3:27b - no phoenix
TomMonks Aug 12, 2025
5f896a6
docs(env) + main arize-phoenix
TomMonks Aug 12, 2025
42c7a8b
feat(evals): run all evals in one go or limit to n of set
TomMonks Aug 12, 2025
56a08f8
feat(callcentre): improved schema desc + improved json prompt
TomMonks Aug 12, 2025
b832d9d
feat(evals): create script now uploads to phoenix as dataset
TomMonks Aug 13, 2025
6476f76
feat(app): draft of a basic streamlit app
TomMonks Sep 30, 2025
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion README.md
Original file line number Diff line number Diff line change
Expand Up @@ -127,7 +127,7 @@ This project was developed and tested on the following system configuration:

1. **Start the MCP server**
```bash
python mcp_server.py
python run_call_centre_server.py
```
Server will be available at `http://localhost:8001/mcp`

Expand Down
7 changes: 4 additions & 3 deletions agent_planning_workflow.py
Original file line number Diff line number Diff line change
Expand Up @@ -438,12 +438,13 @@ async def run_plan(

prompt = prompt_map[step_name]
# Most prompts need schema, user input
schema = memory.get("get_experiment_parameter_schema")
schema = memory.get("get_schema")
result = await client.get_prompt(
prompt.name, {"schema": schema, "user_input": user_input}
)
llm_prompt_text = result.messages[0].content.text
# Actually run LLM (synchronously!)

# run the prompt
llm_result = llm.invoke(llm_prompt_text)
parameters = json.loads(clean_llm_response(llm_result))
memory["parameters"] = parameters
Expand Down Expand Up @@ -551,7 +552,7 @@ async def main(
transient=True, # Removes progress bar after completion
) as progress:
task = progress.add_task("executing", total=None)
memory = await run_plan(plan_steps, features, llm, user_input)
memory = await run_plan(plan_steps, features, llm, user_input, debug_mode)
progress.remove_task(task)

# 4. Results
Expand Down
16 changes: 1 addition & 15 deletions agent_self_reflection.py
Original file line number Diff line number Diff line change
Expand Up @@ -34,7 +34,7 @@
Hard constraints
-------------
MAX_RETRIES : int
Maximum number of parameter generation attempts before bailout (default: 4)
Maximum number of parameter generation attempts before bailout (default: 4)

Examples
--------
Expand Down Expand Up @@ -445,20 +445,6 @@ def parse_arguments():

if __name__ == "__main__":

# TM notes: mistral:7b can fail, then succeed with reflection (or on a 2nd go)
# qwen2:math:7b is not suitable
# gemma3:27b both variants work well
# deepseek-r1:32b is too slow on 4080

#model_name = "gemma3n:e4b"
#model_name = "deepseek-r1:32b"
#model_name = "llama3:latest"
#model_name = "llama3.1:8b"
#model_name = "gemma3:27b"
# model_name = "gemma3:27b-it-qat"
#model_name = "qwen2-math:7b"
#model_name = "mistral:7b"

# Parse command line arguments
args = parse_arguments()

Expand Down
Loading