In [2]:
import dmpchef
import os
import json
from pathlib import Path

# Location of the request JSON, resolved relative to the current working directory.
input_path = Path("data", "inputs", "input.json")

# Read the whole file as UTF-8 text and parse it into Python objects.
data = json.loads(input_path.read_text(encoding="utf-8"))

# Echo the parsed request, pretty-printed and with non-ASCII characters kept as-is.
print(json.dumps(data, indent=2, ensure_ascii=False))



{
  "config": {
    "funding": {
      "agency": "NIH",
      "subagency": "NIMH"
    },
    "pipeline": {
      "rag": false,
      "llm": {
        "provider": "ollama",
        "model_name": "llama3.3:latest"
      }
    },
    "export": {
      "md": true,
      "docx": true,
      "pdf": true,
      "dmptool_json": true
    }
  },
  "inputs": {
    "research_area": "Adolescent mental health, anxiety, and resilience mechanisms",
    "research_context": "This study investigates anxiety symptoms and resilience processes in adolescents using longitudinal behavioral, clinical, and neurobiological assessments. The project aims to identify protective and risk factors associated with mental health trajectories during adolescence.",
    "data_types": "Demographic and clinical datasets; standardized anxiety and resilience scales; behavioral task data; physiological measures (e.g., heart rate variability); derived summary variables; documentation (protocols, data dictionary, README).",
    "

In [3]:
# ============================
# DMP generation: No-RAG run
# ============================
from dmpchef.api import generate

# Call the pipeline on the input JSON with retrieval switched off.
result = generate(input_path, use_rag=False)

# Report only the export file locations found under result["outputs"].
print("\n Export files:")
for name, path in result["outputs"].items():
    print(name, path, sep=": ")



{"timestamp": "2026-02-13T18:08:06.612204Z", "level": "info", "event": "Config loaded successfully"}
{"llm": "llama3.3:latest", "embed": "sentence-transformers/all-MiniLM-L6-v2", "hf_cache_dir": "data/cache/hf", "local_files_only": true, "allow_download_if_missing": true, "temperature": null, "num_predict": null, "num_ctx": null, "top_p": null, "top_k": null, "timestamp": "2026-02-13T18:08:06.614203Z", "level": "info", "event": "ModelLoader initialized"}
{"llm": "llama3.3:latest", "rag_default": true, "data_pdfs": "data\\database", "index_dir": "data\\index", "debug_dir": "data\\outputs\\debug", "force_rebuild_index": false, "timestamp": "2026-02-13T18:08:06.622556Z", "level": "info", "event": "DMPPipeline initialized"}
{"funding_agency": "NIH", "prompt_type": "nih_dmp", "template_md": "data\\inputs\\dmp-template.md", "retrieval_hint": "NIH Data Management and Sharing Plan (DMSP) guidance", "timestamp": "2026-02-13T18:08:06.623554Z", "level": "info", "event": "Funding agency selected"}

Schema validation: PASS (input.json)


HTTP Request: POST http://127.0.0.1:11434/api/generate "HTTP/1.1 200 OK"
{"mode": "norag", "timestamp": "2026-02-13T18:09:40.492877Z", "level": "info", "event": "LLM done"}
{"mode": "norag", "output_chars": 7807, "timestamp": "2026-02-13T18:09:40.492877Z", "level": "info", "event": "DMP generation finished"}
100%|██████████| 1/1 [00:02<00:00,  2.80s/it]


 Export files:
markdown: C:\Users\Nahid\dmpchef\data\outputs\markdown\NIH_NIMH__request__norag__llama3.3_latest.md
dmptool_json: C:\Users\Nahid\dmpchef\data\outputs\json\NIH_NIMH__request__norag__llama3.3_latest.dmptool.json
docx: C:\Users\Nahid\dmpchef\data\outputs\docx\NIH_NIMH__request__norag__llama3.3_latest.docx
pdf: C:\Users\Nahid\dmpchef\data\outputs\pdf\NIH_NIMH__request__norag__llama3.3_latest.pdf





In [4]:
# ============================
# DMP generation: RAG run
# ============================
from dmpchef.api import generate

# Call the pipeline on the same input JSON, this time with retrieval switched on.
result = generate(input_path, use_rag=True)

# Report only the export file locations found under result["outputs"].
print("\n Export files:")
for name, path in result["outputs"].items():
    print(name, path, sep=": ")
    


{"timestamp": "2026-02-13T18:09:45.276517Z", "level": "info", "event": "Config loaded successfully"}
{"llm": "llama3.3:latest", "embed": "sentence-transformers/all-MiniLM-L6-v2", "hf_cache_dir": "data/cache/hf", "local_files_only": true, "allow_download_if_missing": true, "temperature": null, "num_predict": null, "num_ctx": null, "top_p": null, "top_k": null, "timestamp": "2026-02-13T18:09:45.277517Z", "level": "info", "event": "ModelLoader initialized"}
{"llm": "llama3.3:latest", "rag_default": true, "data_pdfs": "data\\database", "index_dir": "data\\index", "debug_dir": "data\\outputs\\debug", "force_rebuild_index": false, "timestamp": "2026-02-13T18:09:45.287027Z", "level": "info", "event": "DMPPipeline initialized"}
{"funding_agency": "NIH", "prompt_type": "nih_dmp", "template_md": "data\\inputs\\dmp-template.md", "retrieval_hint": "NIH Data Management and Sharing Plan (DMSP) guidance", "timestamp": "2026-02-13T18:09:45.288024Z", "level": "info", "event": "Funding agency selected"}

Schema validation: PASS (input.json)


Loading weights: 100%|██████████| 103/103 [00:00<00:00, 1633.18it/s, Materializing param=pooler.dense.weight]                             
[1mBertModel LOAD REPORT[0m from: sentence-transformers/all-MiniLM-L6-v2
Key                     | Status     |  | 
------------------------+------------+--+-
embeddings.position_ids | UNEXPECTED |  | 

[3mNotes:
- UNEXPECTED[3m	:can be ignored when loading from different task/architecture; not ok if you expect identical arch.[0m
{"model": "sentence-transformers/all-MiniLM-L6-v2", "cache_dir": "C:\\Users\\Nahid\\dmpchef\\data\\cache\\hf", "local_files_only": true, "timestamp": "2026-02-13T18:09:45.440448Z", "level": "info", "event": "Embeddings loaded successfully"}
{"timestamp": "2026-02-13T18:09:45.441446Z", "level": "info", "event": "Embeddings ready"}
{"index_dir": "data\\index", "force_rebuild": false, "timestamp": "2026-02-13T18:09:45.442447Z", "level": "info", "event": "Preparing FAISS vectorstore"}
{"path": "data\\index\\index.faiss", "


 Export files:
markdown: C:\Users\Nahid\dmpchef\data\outputs\markdown\NIH_NIMH__request__rag__k6__llama3.3_latest.md
dmptool_json: C:\Users\Nahid\dmpchef\data\outputs\json\NIH_NIMH__request__rag__k6__llama3.3_latest.dmptool.json
docx: C:\Users\Nahid\dmpchef\data\outputs\docx\NIH_NIMH__request__rag__k6__llama3.3_latest.docx
pdf: C:\Users\Nahid\dmpchef\data\outputs\pdf\NIH_NIMH__request__rag__k6__llama3.3_latest.pdf



