internetarchive · jimchamp · Dec 26, 2025 · Dec 26, 2025 · Dec 26, 2025 · Dec 26, 2025
diff --git a/scripts/cron_wrapper.py b/scripts/cron_wrapper.py
@@ -6,34 +6,32 @@
 import argparse
 import subprocess
 import sys
-from configparser import ConfigParser
 from pathlib import Path
 
 import sentry_sdk
+import yaml
 from statsd import StatsClient
 
-DEFAULT_CONFIG_PATH = "/olsystem/etc/cron-wrapper.ini"
+DEFAULT_CONFIG_PATH = "/olsystem/etc/openlibrary.yml"
 
 
 class MonitoredJob:
-    def __init__(self, command, sentry_cfg, statsd_cfg, job_name):
+    def __init__(self, command, sentry_cfg, statsd_server, monitor_slug):
         self.command = command
-        self.statsd_client = (
-            self._setup_statsd(statsd_cfg.get("host", ""), statsd_cfg.get("port", ""))
-            if statsd_cfg
-            else None
+        statsd_host_and_port = statsd_server.split(":")
+        self.statsd_client = self._setup_statsd(
+            statsd_host_and_port[0], statsd_host_and_port[1]
         )
-        statsd_host_and_port = statsd_server.split(":")
-        self.statsd_client = self._setup_statsd(
-            statsd_host_and_port[0], statsd_host_and_port[1]
-        )
+        self.statsd_client = None
+        if statsd_server and ":" in statsd_server:
+            host, port_str = statsd_server.split(":", 1)
+            try:
+                port = int(port_str)
+            except ValueError:
+                port = None
+            if host and port is not None:
+                self.statsd_client = self._setup_statsd(host, port)
-        statsd_host_and_port = statsd_server.split(":")
-        self.statsd_client = self._setup_statsd(
-            statsd_host_and_port[0], statsd_host_and_port[1]
-        )
+        self.statsd_client = None
+        if statsd_server and ":" in statsd_server:
+            host, port_str = statsd_server.split(":", 1)
+            try:
+                port = int(port_str)
+            except ValueError:
+                port = None
+            if host and port is not None:
+                self.statsd_client = self._setup_statsd(host, port)
         self._setup_sentry(sentry_cfg.get("dsn", ""))
-        self.job_name = job_name
+        self.monitor_slug = monitor_slug
         self.job_failed = False
 
     def run(self):
         self._before_run()
         try:
-            self._run_script()
+            with sentry_sdk.monitor(self.monitor_slug):
+                self._run_script()
         except subprocess.CalledProcessError as e:
-            se = RuntimeError(f"Subprocess failed: {e}\n{e.stderr}")
-            sentry_sdk.capture_exception(se)
             self.job_failed = True
             sys.stderr.write(e.stderr)
-            sys.stderr.write(e.stderr)
+            if e.stderr is not None:
+                sys.stderr.write(e.stderr)
+            else:
+                sys.stderr.write(str(e))
-            sys.stderr.write(e.stderr)
+            if e.stderr is not None:
+                sys.stderr.write(e.stderr)
+            else:
+                sys.stderr.write(str(e))
             sys.stderr.flush()
@@ -43,15 +41,17 @@ def run(self):
 
     def _before_run(self):
         if self.statsd_client:
-            self.statsd_client.incr(f'cron.{self.job_name}.start')
-            self.job_timer = self.statsd_client.timer(f'cron.{self.job_name}.duration')
+            self.statsd_client.incr(f'ol.cron.{self.monitor_slug}.start')
+            self.job_timer = self.statsd_client.timer(
+                f'ol.cron.{self.monitor_slug}.duration'
+            )
             self.job_timer.start()
 
     def _after_run(self):
         if self.statsd_client:
             self.job_timer.stop()
             status = "failure" if self.job_failed else "stop"
-            status = "failure" if self.job_failed else "stop"
+            status = "failure" if self.job_failed else "success"
-            status = "failure" if self.job_failed else "stop"
+            status = "failure" if self.job_failed else "success"
-            self.statsd_client.incr(f'cron.{self.job_name}.{status}')
+            self.statsd_client.incr(f'ol.cron.{self.monitor_slug}.{status}')
 
     def _run_script(self):
         return subprocess.run(
@@ -71,21 +71,22 @@ def _setup_statsd(self, host, port):
 
 def main(args):
     config = _read_config(args.config)
-    sentry_cfg = dict(config["sentry"]) if config.has_section("sentry") else None
-    statsd_cfg = dict(config["statsd"]) if config.has_section("statsd") else None
+    sentry_cfg = config.get("sentry_cron_jobs", {})
+    statsd_server = config.get("admin", {}).get("statsd_server", "")
+    config = None
-    config = None
-    config = None
     command = [args.script] + args.script_args
-    job_name = args.job_name
+    monitor_slug = args.monitor_slug
 
-    job = MonitoredJob(command, sentry_cfg, statsd_cfg, job_name)
+    job = MonitoredJob(command, sentry_cfg, statsd_server, monitor_slug)
     job.run()
 
 
 def _read_config(config_path):
     if not Path(config_path).exists():
         raise FileNotFoundError("Missing cron-wrapper configuration file")
-        raise FileNotFoundError("Missing cron-wrapper configuration file")
+        raise FileNotFoundError(f"Missing cron-wrapper configuration file: {config_path}")
-        raise FileNotFoundError("Missing cron-wrapper configuration file")
+        raise FileNotFoundError(f"Missing cron-wrapper configuration file: {config_path}")
-    config_parser = ConfigParser()
-    config_parser.read(config_path)
-    return config_parser
+    with open(config_path) as in_file:
+        config = yaml.safe_load(in_file)
+        return config
 
 
 def _parse_args():
@@ -96,7 +97,7 @@ def _parse_args():
         default=DEFAULT_CONFIG_PATH,
         help=f"Path to cron-wrapper configuration file. Defaults to \"{DEFAULT_CONFIG_PATH}\"",
     )
-    _parser.add_argument("job_name", help="Name of the job to be monitored")
+    _parser.add_argument("monitor_slug", help="Monitor slug of the Sentry cron monitor")
     _parser.add_argument(
         "script", help="Path to script that will be wrapped and monitored"
     )