-- Daily request volume, error rate, and latency per endpoint.
-- Window: from midnight seven days ago through now, so the result can span up
-- to eight calendar days, the most recent of which is still partial.
-- NOTE(review): day boundaries depend on how the engine converts request_time
-- to a date (typically the session time zone) -- confirm that this matches
-- the reporting time zone.
SELECT
    endpoint_name,
    DATE(request_time) AS day,
    COUNT(*) AS total_requests,
    -- Any status_code >= 400 counts as an error. Rows with a NULL status_code
    -- fall through to ELSE and are counted as non-errors.
    SUM(CASE WHEN status_code >= 400 THEN 1 ELSE 0 END) AS errors,
    -- COUNT(*) is at least 1 inside every group, so the division cannot hit zero.
    ROUND(
        SUM(CASE WHEN status_code >= 400 THEN 1 ELSE 0 END) * 100.0 / COUNT(*),
        2
    ) AS error_rate_pct,
    -- AVG and PERCENTILE_CONT both ignore NULL execution_time_ms values.
    ROUND(AVG(execution_time_ms), 1) AS avg_latency_ms,
    ROUND(
        PERCENTILE_CONT(0.99) WITHIN GROUP (ORDER BY execution_time_ms),
        1
    ) AS p99_latency_ms
FROM system.serving.served_model_requests
-- Filter on the raw column instead of DATE(request_time) so the engine can
-- use file/partition statistics to skip data. Assumes request_time is a
-- TIMESTAMP, in which case this selects the same rows -- TODO confirm.
WHERE request_time >= CURRENT_DATE() - INTERVAL 7 DAYS
GROUP BY
    endpoint_name,
    DATE(request_time)
ORDER BY
    day DESC,
    endpoint_name;
-- Track changes in provisioned concurrency per endpoint.
-- Window: from midnight seven days ago through now (today is included, so up
-- to eight calendar days of events are returned), newest change first.
SELECT
    endpoint_name,
    change_time,
    scaled_entity_name,
    previous_scale,
    new_scale
FROM system.serving.endpoint_scaling_events
-- Filter on the raw column instead of DATE(change_time) so the engine can
-- use file/partition statistics to skip data. Assumes change_time is a
-- TIMESTAMP, in which case this selects the same rows -- TODO confirm.
WHERE change_time >= CURRENT_DATE() - INTERVAL 7 DAYS
ORDER BY
    change_time DESC,
    -- Tiebreakers keep the output order deterministic when several events
    -- share the same change_time.
    endpoint_name,
    scaled_entity_name;