Skip to content

Commit 4e415b7

Browse files
authored
Validate Prometheus Connection (#118)
This falls under the category of #61. Just trying to ensure the user is aware of the error without an explosion of irrelevant stack traces.
1 parent 7169958 commit 4e415b7

File tree

3 files changed

+29
-3
lines changed

3 files changed

+29
-3
lines changed

src/main.py

+5-1
Original file line numberDiff line numberDiff line change
@@ -26,6 +26,7 @@
2626
from src.args import Args
2727
from src.config import RuntimeConfig
2828
from src.job import Job
29+
from src.logger import log
2930

3031

3132
async def main(jobs: list[Job]) -> None:
@@ -37,7 +38,10 @@ async def main(jobs: list[Job]) -> None:
3738
"""
3839
tasks = [job.run() for job in jobs]
3940
for completed_task in asyncio.as_completed(tasks):
40-
await completed_task
41+
try:
42+
await completed_task
43+
except Exception as e: # pylint: disable=broad-exception-caught
44+
log.error("Error in job execution: %s", str(e))
4145

4246

4347
if __name__ == "__main__":

src/metrics.py

+22
Original file line numberDiff line numberDiff line change
@@ -6,6 +6,7 @@
66
from time import perf_counter
77
from typing import Any
88

9+
import requests
910
from prometheus_client import CollectorRegistry, Counter, Gauge, push_to_gateway
1011

1112
# MARKER: pylint-bug
@@ -15,6 +16,8 @@
1516
from src.interfaces import Named
1617
from src.logger import log
1718

19+
SUCCESS_STATUS = 200
20+
1821

1922
def log_job_metrics(prometheus_url: str, job_metrics: dict[str, Any]) -> None:
2023
"""Log metrics about a job to a prometheus pushgateway."""
@@ -60,6 +63,7 @@ async def wrapper(
6063
if not (prometheus_url := env("PROMETHEUS_PUSHGATEWAY_URL")):
6164
return await func(self, *args, **kwargs)
6265

66+
validate_prometheus_url(prometheus_url)
6367
run_id = uuid.uuid4().hex
6468
start = perf_counter()
6569
success = False
@@ -82,3 +86,21 @@ async def wrapper(
8286
log_job_metrics(prometheus_url, metrics)
8387

8488
return wrapper
89+
90+
91+
def validate_prometheus_url(prometheus_url: str) -> None:
92+
"""Ensure Valid Connection to Prometheus."""
93+
try:
94+
response = requests.get(prometheus_url, timeout=5)
95+
if response.status_code == SUCCESS_STATUS:
96+
return
97+
log.error(
98+
"Failed to connect to Prometheus Pushgateway: %s %s",
99+
response.status_code,
100+
response.reason,
101+
)
102+
except requests.exceptions.RequestException as e:
103+
log.error("Error connecting to Prometheus Pushgateway: %s", str(e))
104+
raise ConnectionError(
105+
f"Failed to connect to Prometheus Pushgateway at {prometheus_url}",
106+
)

tests/unit/job_test.py

+2-2
Original file line numberDiff line numberDiff line change
@@ -44,9 +44,9 @@ async def test_metrics_collection(self, mock_metrics_push, *_):
4444
await test_job.run()
4545
mock_metrics_push.assert_not_called()
4646

47-
with patch("src.metrics.env", return_value="http://localhost:9090"):
47+
with patch("src.metrics.env", return_value="http://localhost:9091"):
4848
await test_job.run()
4949
mock_metrics_push.assert_called_once()
5050
call_kwargs = mock_metrics_push.mock_calls[0].kwargs
51-
self.assertEqual("http://localhost:9090", call_kwargs["gateway"])
51+
self.assertEqual("http://localhost:9091", call_kwargs["gateway"])
5252
self.assertEqual("dune-sync-job name", call_kwargs["job"])

0 commit comments

Comments
 (0)