microdao-daarion/services/senpai-md-consumer/senpai/md_consumer/metrics.py
Apple 09dee24342 feat: MD pipeline — market-data-service hardening + SenpAI NATS consumer
Producer (market-data-service):
- Backpressure: smart drop policy (drop heartbeats first, then quotes; trades preserved)
- Heartbeat monitor: synthetic HeartbeatEvent on provider silence
- Graceful shutdown: WS→bus→storage→DB engine cleanup sequence
- Bybit V5 public WS provider (backup for Binance, no API key needed)
- FailoverManager: health-based provider switching with recovery
- NATS output adapter: md.events.{type}.{symbol} for SenpAI
- /bus-stats endpoint for backpressure monitoring
- Dockerfile + docker-compose.node1.yml integration
- 36 tests (parsing + bus + failover), requirements.lock

Consumer (senpai-md-consumer):
- NATSConsumer: subscribe md.events.>, queue group senpai-md, backpressure
- State store: LatestState + RollingWindow (deque, 60s)
- Feature engine: 11 features (mid, spread, VWAP, return, vol, latency)
- Rule-based signals: long/short on return+volume+spread conditions
- Publisher: rate-limited features + signals + alerts to NATS
- HTTP API: /health, /metrics, /state/latest, /features/latest, /stats
- 10 Prometheus metrics
- Dockerfile + docker-compose.senpai.yml
- 41 tests (parsing + state + features + rate-limit), requirements.lock
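A minimal sketch of the consumer's subscription setup, assuming the nats-py client. `run_consumer`, `parse_subject`, and the handler body are illustrative names, not the service's actual API; only the subject pattern `md.events.>` and queue group `senpai-md` come from the commit message.

```python
def parse_subject(subject: str) -> tuple[str, str]:
    """Split 'md.events.{type}.{symbol}' into (event_type, symbol)."""
    _, _, event_type, symbol = subject.split(".", 3)
    return event_type, symbol


async def run_consumer(url: str = "nats://localhost:4222") -> None:
    import nats  # nats-py; imported lazily so the parsing helper stays stdlib-only

    nc = await nats.connect(url)

    async def handler(msg):
        event_type, symbol = parse_subject(msg.subject)
        ...  # update state store, compute features, emit signals

    # Queue group lets multiple consumer replicas share the event stream
    await nc.subscribe("md.events.>", queue="senpai-md", cb=handler)
```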

CI: ruff + pytest + smoke import for both services
Tests: 77 total passed, lint clean
Co-authored-by: Cursor <cursoragent@cursor.com>
2026-02-09 11:46:15 -08:00


"""
Prometheus metrics for SenpAI market-data consumer.
"""
from prometheus_client import Counter, Gauge, Histogram

# ── Inbound events ─────────────────────────────────────────────────────
EVENTS_IN = Counter(
    "senpai_events_in_total",
    "Total events received from NATS",
    ["event_type", "provider"],
)
EVENTS_DROPPED = Counter(
    "senpai_events_dropped_total",
    "Events dropped due to backpressure or errors",
    ["reason", "event_type"],
)

# ── Queue ──────────────────────────────────────────────────────────────
QUEUE_FILL = Gauge(
    "senpai_queue_fill_ratio",
    "Internal processing queue fill ratio (0..1)",
)
QUEUE_SIZE = Gauge(
    "senpai_queue_size",
    "Current number of items in processing queue",
)

# ── Processing ─────────────────────────────────────────────────────────
PROCESSING_LATENCY = Histogram(
    "senpai_processing_latency_ms",
    "End-to-end processing latency (NATS receive to feature publish) in ms",
    buckets=[0.1, 0.5, 1, 2, 5, 10, 25, 50, 100, 250],
)

# ── Feature publishing ─────────────────────────────────────────────────
FEATURE_PUBLISH = Counter(
    "senpai_feature_publish_total",
    "Total feature snapshots published to NATS",
    ["symbol"],
)
FEATURE_PUBLISH_ERRORS = Counter(
    "senpai_feature_publish_errors_total",
    "Failed feature publishes",
    ["symbol"],
)

# ── Signals ────────────────────────────────────────────────────────────
SIGNALS_EMITTED = Counter(
    "senpai_signals_emitted_total",
    "Trade signals emitted",
    ["symbol", "direction"],
)
ALERTS_EMITTED = Counter(
    "senpai_alerts_emitted_total",
    "Alerts emitted",
    ["alert_type"],
)

# ── NATS connection ───────────────────────────────────────────────────
NATS_CONNECTED = Gauge(
    "senpai_nats_connected",
    "Whether NATS connection is alive (1=yes, 0=no)",
)
NATS_RECONNECTS = Counter(
    "senpai_nats_reconnects_total",
    "Number of NATS reconnections",
)