opengris-scaler/src/scaler/cluster/cluster.py at 15f3c42ef829ae5e7c30a1d56045c300e5a8bcf9 · finos/opengris-scaler · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
import asyncio
import logging
import multiprocessing
import signal

from scaler.config.common.worker_adapter import WorkerAdapterConfig
from scaler.config.section.cluster import ClusterConfig
from scaler.config.section.fixed_native_worker_adapter import FixedNativeWorkerAdapterConfig
from scaler.utility.event_loop import run_task_forever
from scaler.utility.logging.utility import setup_logger
from scaler.worker_manager_adapter.baremetal.fixed_native import FixedNativeWorkerAdapter


class Cluster(multiprocessing.get_context("spawn").Process):  # type: ignore[misc]
    def __init__(self, config: ClusterConfig):
        multiprocessing.Process.__init__(self, name="WorkerMaster")

        self._address = config.scheduler_address
        self._object_storage_address = config.object_storage_address
        self._preload = config.preload
        self._worker_io_threads = config.worker_io_threads
        self._worker_names = config.worker_names.names
        self._per_worker_capabilities = config.worker_config.per_worker_capabilities.capabilities

        self._per_worker_task_queue_size = config.worker_config.per_worker_task_queue_size
        self._heartbeat_interval_seconds = config.worker_config.heartbeat_interval_seconds
        self._task_timeout_seconds = config.worker_config.task_timeout_seconds
        self._death_timeout_seconds = config.worker_config.death_timeout_seconds
        self._garbage_collect_interval_seconds = config.worker_config.garbage_collect_interval_seconds
        self._trim_memory_threshold_bytes = config.worker_config.trim_memory_threshold_bytes
        self._hard_processor_suspend = config.worker_config.hard_processor_suspend
        self._event_loop = config.event_loop

        self._logging_paths = config.logging_config.paths
        self._logging_config_file = config.logging_config.config_file
        self._logging_level = config.logging_config.level
        self._deterministic_worker_ids = config.deterministic_worker_ids

        # we create the config here, but create the actual adapter in the run method
        # to ensure that it's created in the correct process
        self._worker_adapter_config = FixedNativeWorkerAdapterConfig(
            preload=config.preload,
            worker_adapter_config=WorkerAdapterConfig(
                scheduler_address=config.scheduler_address,
                object_storage_address=config.object_storage_address,
                max_workers=len(config.worker_names),
            ),
            worker_config=config.worker_config,
            logging_config=config.logging_config,
            event_loop=config.event_loop,
            worker_io_threads=config.worker_io_threads,
        )

    def run(self):
        self.__initialize()
        setup_logger(self._logging_paths, self._logging_config_file, self._logging_level)

        self._loop = asyncio.new_event_loop()
        run_task_forever(self._loop, self._run())

    def __initialize(self):
        self._worker_adapter = FixedNativeWorkerAdapter(self._worker_adapter_config)

    async def _run(self):
        self._stopped = asyncio.Event()

        self._loop.add_signal_handler(signal.SIGINT, self.__destroy)
        self._loop.add_signal_handler(signal.SIGTERM, self.__destroy)

        await self.__start_workers_and_run_forever()

    def __destroy(self):
        logging.info(f"{self.__get_prefix()} received signal, shutting down")

        # set the stopped event to exit the main loop
        self._loop.call_soon_threadsafe(self._stopped.set)

    async def __start_workers_and_run_forever(self):
        logging.info(
            f"{self.__get_prefix()} starting {len(self._worker_names)} workers, heartbeat_interval_seconds="
            f"{self._heartbeat_interval_seconds}, task_timeout_seconds={self._task_timeout_seconds}"
        )

        self._worker_adapter.start()

        # run until stopped
        try:
            stop_task = asyncio.create_task(self._stopped.wait())

            # this is a blocking call, so we must run it in the executor
            join_task = self._loop.run_in_executor(None, self._worker_adapter.join)

            # we're done when either all the workers have exited, or we received a stop signal
            done, pending = await asyncio.wait([stop_task, join_task], return_when=asyncio.FIRST_COMPLETED)

            # the wait call returns as soon as one of the tasks is done
            # we should cancel the other task to clean it up before the loop closes
            for task in pending:
                task.cancel()

                try:
                    await task
                except asyncio.CancelledError:
                    pass
                except Exception as e:
                    logging.error(f"{self.__get_prefix()} error while waiting for tasks to complete: {e!r}")
        finally:
            # shut down all workers
            self._worker_adapter.shutdown()

        logging.info(f"{self.__get_prefix()} shutdown")

    def __get_prefix(self):
        return f"{self.__class__.__name__}:"

    def shutdown(self):
        self.terminate()
        self.join()