From 14157f43be3e0b0dded3bdecb3a1a5c6efd539be Mon Sep 17 00:00:00 2001 From: Dominic Watson Date: Fri, 25 Apr 2025 13:43:39 +0100 Subject: [PATCH] Add port annotation for Prometheus to use when scraping for metrics. This should allow support for more hosting scenarios where Prometheus may be trying a default port, e.g. 9100, rather than automatically trying the ports defined on the service. --- assets/state-dcgm-exporter/0600_service.yaml | 1 + assets/state-node-status-exporter/0500_service.yaml | 1 + assets/state-operator-metrics/0200_service.yaml | 1 + 3 files changed, 3 insertions(+) diff --git a/assets/state-dcgm-exporter/0600_service.yaml b/assets/state-dcgm-exporter/0600_service.yaml index 6f9781aed..c1175124c 100644 --- a/assets/state-dcgm-exporter/0600_service.yaml +++ b/assets/state-dcgm-exporter/0600_service.yaml @@ -7,6 +7,7 @@ metadata: app: nvidia-dcgm-exporter annotations: prometheus.io/scrape: "true" + prometheus.io/port: "9400" spec: selector: app: nvidia-dcgm-exporter diff --git a/assets/state-node-status-exporter/0500_service.yaml b/assets/state-node-status-exporter/0500_service.yaml index 1b07979c6..05a328fc1 100644 --- a/assets/state-node-status-exporter/0500_service.yaml +++ b/assets/state-node-status-exporter/0500_service.yaml @@ -7,6 +7,7 @@ metadata: app: nvidia-node-status-exporter annotations: prometheus.io/scrape: "true" + prometheus.io/port: "8000" spec: selector: app: nvidia-node-status-exporter diff --git a/assets/state-operator-metrics/0200_service.yaml b/assets/state-operator-metrics/0200_service.yaml index be326d9ae..0a27effd6 100644 --- a/assets/state-operator-metrics/0200_service.yaml +++ b/assets/state-operator-metrics/0200_service.yaml @@ -7,6 +7,7 @@ metadata: app: gpu-operator annotations: prometheus.io/scrape: "true" + prometheus.io/port: "8080" spec: selector: app: gpu-operator