JD.AI Gateway Operations
- Type: operations
- Kind: OperationsIndex
- ID: operations.jdai-gateway
- Status: draft
- Source: specs/operations/examples/operations.example.yaml
YAML
# Top-level identity fields of this Operations document.
apiVersion: jdai.upss/v1
kind: Operations
id: operations.jdai-gateway
version: 1
status: draft
# Ownership and review metadata for this specification.
metadata:
  owners:
    - JerrettDavis
  reviewers:
    - upss-operations-runbook-agent
  # Unquoted ISO date: YAML 1.1 loaders may type this as a date, not a string.
  lastReviewed: 2026-03-07
  changeReason: Establish the first canonical operational specification for the JD.AI gateway service.
# NOTE(review): kept at top level; the flattened source does not show whether
# `service` was nested under `metadata` — confirm against the schema.
service: jdai-gateway
# Runbooks: each entry names a scenario, its trigger condition, and the
# ordered list of steps to follow.
runbooks:
  - name: Gateway Health Degradation
    description: Steps to diagnose and restore gateway health when latency exceeds thresholds.
    triggerCondition: P95 latency exceeds 500ms for 5 consecutive minutes.
    steps:
      - Check gateway pod status and recent restart events.
      - Review upstream dependency health endpoints.
      - Inspect recent deployment changes for regressions.
      - Scale gateway replicas if load-related.
      - Escalate to on-call engineer if unresolved within 15 minutes.
# Incident severity levels, each with a description and a response time.
incidentLevels:
  - level: sev1
    description: Complete service outage affecting all users.
    responseTime: 5 minutes
  - level: sev2
    description: Partial degradation affecting a significant subset of users.
    responseTime: 15 minutes
# Acknowledge/resolve targets per incident level.
# NOTE(review): only sev1 is listed here, while incidentLevels also defines
# sev2 — confirm whether a sev2 entry is intended.
responseSlos:
  - level: sev1
    acknowledgeWithin: 5 minutes
    resolveWithin: 1 hour
# Contacts to escalate to, per incident level.
# NOTE(review): only sev1 is listed here, while incidentLevels also defines
# sev2 — confirm whether a sev2 entry is intended.
escalationPaths:
  - level: sev1
    contacts:
      - on-call-primary
      - engineering-lead
# Traceability links from this specification to related files.
trace:
  upstream:
    - specs/vision/examples/vision.example.yaml
  # NOTE(review): `governance` and `audits` are nested under `downstream`
  # because the flattened source lists them directly after the otherwise
  # empty `downstream:` key — confirm against the schema.
  downstream:
    governance:
      - tests/JD.AI.Tests/Specifications/OperationsSpecificationRepositoryTests.cs
    audits:
      - src/JD.AI.Core/Specifications/OperationsSpecification.cs