In [20]:
import dmpchef
import os
import json
from pathlib import Path

# Location of the input JSON, relative to the current working directory
input_path = Path("data", "inputs", "input.json")

# Read the file as UTF-8 text and parse it as JSON in one step
data = json.loads(input_path.read_text(encoding="utf-8"))

# Echo the parsed input, pretty-printed; ensure_ascii=False keeps non-ASCII characters unescaped
print(json.dumps(data, ensure_ascii=False, indent=2))



{
  "config": {
    "funding": {
      "agency": "NIH",
      "subagency": "NIMH"
    },
    "pipeline": {
      "rag": true,
      "llm": {
        "provider": "ollama",
        "model_name": "llama3.3:latest"
      }
    },
    "export": {
      "md": true,
      "docx": true,
      "pdf": true,
      "dmptool_json": true
    }
  },
  "inputs": {
    "research_area": "Autism and social communication",
    "research_context": "This study examines social communication and neurodevelopmental profiles in youth with autism compared to typically developing peers using behavioral, clinical, and neurobiological measures. NDA GUID elements will be collected for submission to the NIMH Data Archive (NDA).",
    "data_types": "Demographic and clinical datasets; behavioral and cognitive assessments; neuroimaging and/or physiological measures; derived variables; documentation (protocols, data dictionary, README).",
    "data_source": "IRB-approved human participant study using standardized assessm

In [21]:
# ----------------------------
# Run No-RAG
# ----------------------------
from dmpchef.api import generate

# Call generate on the input JSON with use_rag=False (the No-RAG run)
result = generate(input_path, use_rag=False)

# Print only the "outputs" mapping of the result: one "<name>: <path>" line per entry
export_paths = result["outputs"]
print("\n Export files:")
for label, location in export_paths.items():
    print("{}: {}".format(label, location))



{"timestamp": "2026-02-12T18:40:03.534416Z", "level": "info", "event": "Config loaded successfully"}


{"llm": "llama3.3:latest", "embed": "sentence-transformers/all-MiniLM-L6-v2", "hf_cache_dir": "data/cache/hf", "local_files_only": true, "allow_download_if_missing": true, "temperature": null, "num_predict": null, "num_ctx": null, "top_p": null, "top_k": null, "timestamp": "2026-02-12T18:40:03.536442Z", "level": "info", "event": "ModelLoader initialized"}
{"llm": "llama3.3:latest", "rag_default": true, "data_pdfs": "data\\database", "index_dir": "data\\index", "debug_dir": "data\\outputs\\debug", "force_rebuild_index": false, "timestamp": "2026-02-12T18:40:03.545440Z", "level": "info", "event": "DMPPipeline initialized"}
{"funding_agency": "NIH", "prompt_type": "nih_dmp", "template_md": "data\\inputs\\dmp-template.md", "retrieval_hint": "NIH Data Management and Sharing Plan (DMSP) guidance", "timestamp": "2026-02-12T18:40:03.545440Z", "level": "info", "event": "Funding agency selected"}
{"mode": "norag", "use_rag_input": false, "rag_default": true, "use_rag_final": false, "timestamp": 


 Export files:
markdown: C:\Users\Nahid\dmpchef\data\outputs\markdown\request__norag__llama3.3_latest.md
dmptool_json: C:\Users\Nahid\dmpchef\data\outputs\json\request__norag__llama3.3_latest.dmptool.json
docx: C:\Users\Nahid\dmpchef\data\outputs\docx\request__norag__llama3.3_latest.docx
pdf: C:\Users\Nahid\dmpchef\data\outputs\pdf\request__norag__llama3.3_latest.pdf





In [None]:
# ----------------------------
# Run RAG
# ----------------------------
# Imported again here so this cell can run without the No-RAG cell having been executed
from dmpchef.api import generate

# Call generate on the same input JSON, this time with use_rag=True (the RAG run)
result = generate(input_path, use_rag=True)

# Print only the "outputs" mapping of the result: one "<name>: <path>" line per entry
export_paths = result["outputs"]
print("\n Export files:")
for label, location in export_paths.items():
    print("{}: {}".format(label, location))


{"timestamp": "2026-02-12T18:41:14.394435Z", "level": "info", "event": "Config loaded successfully"}
{"llm": "llama3.3:latest", "embed": "sentence-transformers/all-MiniLM-L6-v2", "hf_cache_dir": "data/cache/hf", "local_files_only": true, "allow_download_if_missing": true, "temperature": null, "num_predict": null, "num_ctx": null, "top_p": null, "top_k": null, "timestamp": "2026-02-12T18:41:14.395436Z", "level": "info", "event": "ModelLoader initialized"}
{"llm": "llama3.3:latest", "rag_default": true, "data_pdfs": "data\\database", "index_dir": "data\\index", "debug_dir": "data\\outputs\\debug", "force_rebuild_index": false, "timestamp": "2026-02-12T18:41:14.404434Z", "level": "info", "event": "DMPPipeline initialized"}
{"funding_agency": "NIH", "prompt_type": "nih_dmp", "template_md": "data\\inputs\\dmp-template.md", "retrieval_hint": "NIH Data Management and Sharing Plan (DMSP) guidance", "timestamp": "2026-02-12T18:41:14.405434Z", "level": "info", "event": "Funding agency selected"}