Files
2026-06-29 08:13:34 +00:00

194 lines
5.4 KiB
YAML

# Document header.
# NOTE(review): `version` is presumably the schema version of this config
# format and `kind` the document type a loader dispatches on — confirm.
version: 1
kind: platform-infra-observability
# Identification and provenance of this document.
# NOTE(review): nesting was reconstructed after the indentation was lost;
# `relatedIssues` is assumed to belong to `metadata` — confirm.
metadata:
  id: observability
  owner: unidesk
  spec: PJ2026-01060501 OTel追踪 draft-2026-06-19-p0
  # Issue numbers related to this document (tracker not stated here).
  relatedIssues:
    - 489
    - 1181
# Default selection. `targetId` matches the `id` of the D601 entry in `targets`.
defaults:
  targetId: D601
# Container images, keyed by component (collector, tempo).
# Each component carries its own repository/tag/pullPolicy triple, so the
# keys must be nested; left flat they collide as duplicate keys.
# Tags are quoted so they always load as strings, even if a future tag
# happens to look like a number (for example 2.8).
images:
  collector:
    repository: docker.m.daocloud.io/otel/opentelemetry-collector-contrib
    tag: '0.130.1'
    pullPolicy: IfNotPresent
  tempo:
    repository: docker.m.daocloud.io/grafana/tempo
    tag: '2.8.1'
    pullPolicy: IfNotPresent
# Deployment targets. Every entry uses the same namespace, is marked active
# and enabled, and asks for the namespace to be created.
# NOTE(review): `route` looks like "<target id>:<cluster flavour>" — confirm
# the exact format with the consumer.
targets:
  - id: D601
    route: D601:k3s
    namespace: platform-infra
    role: active
    enabled: true
    createNamespace: true
  - id: D518
    route: D518:k3s
    namespace: platform-infra
    role: active
    enabled: true
    createNamespace: true
  - id: JD01
    route: JD01:k3s
    namespace: platform-infra
    role: active
    enabled: true
    createNamespace: true
# Collector workload: object names, replica count and listening ports.
collector:
  deploymentName: otel-collector
  serviceName: otel-collector
  configMapName: otel-collector-config
  replicas: 1
  # Port used for health checks (see the `collector-health` probe entry).
  healthPort: 13133
  # OTLP receiver ports, one per transport.
  otlp:
    grpcPort: 4317
    httpPort: 4318
# Trace storage backend (Tempo): object names, replica count and ports.
# NOTE(review): nesting was reconstructed after the indentation was lost;
# `otlp` and `storage` are assumed to be children of `traceBackend` — confirm.
traceBackend:
  type: tempo
  deploymentName: tempo
  serviceName: tempo
  configMapName: tempo-config
  replicas: 1
  httpPort: 3200
  # OTLP ingest ports, one per transport.
  otlp:
    grpcPort: 4317
    httpPort: 4318
  # NOTE(review): `emptyDir` presumably maps to a Kubernetes emptyDir volume,
  # in which case stored traces do not survive a pod restart — confirm.
  storage:
    mode: emptyDir
    retention: 24h
# Trace sampling policy.
# NOTE(review): assumed to be a top-level section (nesting was reconstructed).
# `parentbased_traceidratio` matches the OpenTelemetry sampler of that name;
# with ratio 1 it would sample every root trace — confirm this is intended.
sampling:
  mode: parentbased_traceidratio
  ratio: 1
# Instrumentation contract for the services that emit traces.
# NOTE(review): nesting was reconstructed after the indentation was lost;
# `resourceAttributes` and `businessCorrelationAttributes` are assumed to be
# children of `instrumentation` — confirm against the consumer's schema.
instrumentation:
  # Context propagation formats.
  contextPropagation:
    - tracecontext
    - baggage
  # One entry per (service, target/lane) pair. `configRefs` values have the
  # form "<file>#<dotted path>"; the spans each service must emit are listed
  # under `requiredSpans`.
  serviceConnections:
    - serviceName: hwlab-cloud-api
      owningRepo: pikasTech/HWLAB
      configRefs:
        targetNode: config/hwlab-node-lanes.yaml#lanes.v03.targets.D601.node
        lane: config/hwlab-node-lanes.yaml#lanes.v03.version
        namespace: config/hwlab-node-lanes.yaml#lanes.v03.targets.D601.runtime.namespace
      requiredSpans:
        - POST /v1/agent/chat
        - durable_admission
        - billing_preflight
        - agentrun_dispatch
        - projection_write
        - trace_events_read
        - turn_status_read
    - serviceName: hwlab-cloud-api
      owningRepo: pikasTech/HWLAB
      configRefs:
        targetNode: config/hwlab-node-lanes.yaml#lanes.v03.targets.D518.node
        lane: config/hwlab-node-lanes.yaml#lanes.v03.version
        namespace: config/hwlab-node-lanes.yaml#lanes.v03.targets.D518.runtime.namespace
      requiredSpans:
        - POST /v1/agent/chat
        - durable_admission
        - billing_preflight
        - agentrun_dispatch
        - projection_write
        - trace_events_read
        - turn_status_read
    - serviceName: hwlab-cloud-api
      owningRepo: pikasTech/HWLAB
      configRefs:
        targetNode: config/hwlab-node-lanes.yaml#lanes.v03.targets.JD01.node
        lane: config/hwlab-node-lanes.yaml#lanes.v03.version
        namespace: config/hwlab-node-lanes.yaml#lanes.v03.targets.JD01.runtime.namespace
      requiredSpans:
        - POST /v1/agent/chat
        - durable_admission
        - billing_preflight
        - agentrun_dispatch
        - projection_write
        - trace_events_read
        - turn_status_read
    - serviceName: user-billing
      owningRepo: pikasTech/HWLAB
      configRefs:
        targetNode: config/hwlab-node-lanes.yaml#lanes.v03.targets.D601.node
        lane: config/hwlab-node-lanes.yaml#lanes.v03.version
        namespace: config/hwlab-node-lanes.yaml#lanes.v03.targets.D601.runtime.namespace
      requiredSpans:
        - billing_preflight
    - serviceName: user-billing
      owningRepo: pikasTech/HWLAB
      configRefs:
        targetNode: config/hwlab-node-lanes.yaml#lanes.v03.targets.D518.node
        lane: config/hwlab-node-lanes.yaml#lanes.v03.version
        namespace: config/hwlab-node-lanes.yaml#lanes.v03.targets.D518.runtime.namespace
      requiredSpans:
        - billing_preflight
    - serviceName: user-billing
      owningRepo: pikasTech/HWLAB
      configRefs:
        targetNode: config/hwlab-node-lanes.yaml#lanes.v03.targets.JD01.node
        lane: config/hwlab-node-lanes.yaml#lanes.v03.version
        namespace: config/hwlab-node-lanes.yaml#lanes.v03.targets.JD01.runtime.namespace
      requiredSpans:
        - billing_preflight
    - serviceName: agentrun-manager
      owningRepo: pikasTech/agentrun
      configRefs:
        targetNode: config/agentrun.yaml#controlPlane.lanes.v02.node
        lane: config/agentrun.yaml#controlPlane.lanes.v02.version
        namespace: config/agentrun.yaml#controlPlane.lanes.v02.runtime.namespace
      requiredSpans:
        - agentrun_dispatch
        - run_created
        - command_result
        - projection_sync
    - serviceName: agentrun-manager
      owningRepo: pikasTech/agentrun
      configRefs:
        targetNode: config/agentrun.yaml#controlPlane.lanes.jd01-v02.node
        lane: config/agentrun.yaml#controlPlane.lanes.jd01-v02.version
        namespace: config/agentrun.yaml#controlPlane.lanes.jd01-v02.runtime.namespace
      requiredSpans:
        - agentrun_dispatch
        - run_created
        - command_result
        - projection_sync
  # Resource attributes listed as required.
  resourceAttributes:
    required:
      - service.name
      - deployment.environment
      - unidesk.node
      - hwlab.lane
      - k8s.namespace.name
      - git.commit
  # Business identifiers used for correlation.
  # NOTE(review): presumably attached to spans as attributes — confirm.
  businessCorrelationAttributes:
    - traceId
    - sessionId
    - turnId
    - runId
    - commandId
# Probe paths and status endpoints.
# NOTE(review): nesting was reconstructed after the indentation was lost;
# `statusEndpoints` is assumed to be a child of `probes` — confirm.
probes:
  readinessPath: /ready
  # Quoted because the value contains `{{ }}` placeholder braces; the loaded
  # string is unchanged.
  traceQueryPathTemplate: '/api/traces/{{traceId}}'
  # `service` values match the `serviceName` of the trace backend and the
  # collector. NOTE(review): `portName` presumably names a port on that
  # service — confirm.
  statusEndpoints:
    - name: tempo-ready
      service: tempo
      portName: http
      path: /ready
    - name: collector-health
      service: otel-collector
      portName: health
      path: /