diff --git a/docs/astro.config.mjs b/docs/astro.config.mjs index 7e868faa27..7bcdfc67e2 100644 --- a/docs/astro.config.mjs +++ b/docs/astro.config.mjs @@ -304,7 +304,7 @@ export default defineConfig({ { label: 'MemoryOps', link: '/guides/memoryops/' }, { label: 'MultiRepoOps', link: '/patterns/multi-repo-ops/' }, { label: 'Monitoring', link: '/patterns/monitoring/' }, - { label: 'Agentic Observability Kit', link: '/patterns/agentic-observability-kit/' }, + { label: 'Agentic Ops', link: '/patterns/agentic-ops/' }, { label: 'Orchestration', link: '/patterns/orchestration/' }, { label: 'ProjectOps', link: '/patterns/project-ops/' }, { label: 'ResearchPlanAssignOps', link: '/patterns/research-plan-assign-ops/' }, diff --git a/docs/src/content/docs/patterns/agentic-ops.md b/docs/src/content/docs/patterns/agentic-ops.md new file mode 100644 index 0000000000..d6911e3156 --- /dev/null +++ b/docs/src/content/docs/patterns/agentic-ops.md @@ -0,0 +1,33 @@ +--- +title: Agentic Ops +description: Monitor agentic workflows across a repository, publish observability reports, and escalate recurring failures or waste. +sidebar: + badge: { text: 'Observability', variant: 'tip' } +--- + +Use this pattern when you want a scheduled workflow to inspect other agentic workflows, summarize what happened, and escalate unusual cost or failure patterns. + +The [agentic-ops repository](https://github.com/githubnext/agentic-ops) provides the reference implementation for this approach. + +## What this pattern does + +This pattern reviews workflow logs across a repository, classifies notable behavior, and publishes a structured report. When it detects repeated failures, abnormal token consumption, or other unhealthy patterns, it can escalate those findings into issues for follow-up. + +This pattern is useful for repository-wide monitoring because it creates a durable operational record instead of relying on ad hoc inspection of individual workflow runs. + +## Typical workflow + +1. 
Run on a schedule to collect recent workflow activity. +2. Analyze logs, costs, and failure signals across runs. +3. Post a summary report to a GitHub Discussion or another durable destination. +4. Open or update issues when the same problem crosses a threshold. + +## When to use it + +Use this pattern when a repository has enough workflow activity that maintainers need a regular summary instead of checking each run manually. It also helps when workflows span multiple teams, and failures or waste need to be surfaced in a shared location. + +## Related documentation + +- [Projects & Monitoring](/gh-aw/patterns/monitoring/) for durable tracking with Projects and safe outputs +- [Custom OTLP Attributes](/gh-aw/guides/custom-otlp-attributes/) for enriching workflow telemetry +- [Audit Commands](/gh-aw/reference/audit/) for investigating individual runs and regressions