-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathdaemon.py
More file actions
163 lines (135 loc) · 6.14 KB
/
daemon.py
File metadata and controls
163 lines (135 loc) · 6.14 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
from datetime import datetime, timedelta
from sqlalchemy.ext.asyncio import async_scoped_session
from sqlalchemy.future import select
from ..common import notification, timestamp
from ..common.enums import StatusEnum
from ..config import config
from ..db.node import NodeMixin
from ..db.queue import Queue
from ..db.script import Script
from .htcondor import build_htcondor_submit_environment, import_htcondor
from .logging import LOGGER
logger = LOGGER.bind(module=__name__)
async def check_due_date(session: async_scoped_session, node: NodeMixin, time_next_check: datetime) -> None:
    """Check whether a node's configured due date has passed and notify.

    Reads the node's ``due_date`` (a POSIX timestamp) from its metadata; if
    the next scheduled check would fall after that deadline, resolves the
    node's campaign and sends an "overdue" notification for it.

    Parameters
    ----------
    session
        Async database session used to resolve the node's campaign.
    node
        Node whose ``metadata_`` mapping may carry a ``due_date`` entry.
    time_next_check
        Scheduled time of the next daemon check for this node.
    """
    # Annotation fixed: the metadata lookup yields None for nodes without a
    # configured deadline, so this is not plain ``int``.
    due_date: int | None = node.metadata_.get("due_date", None)
    if due_date is None:
        return
    if time_next_check.timestamp() > due_date:
        campaign = await node.get_campaign(session)
        await notification.send_notification(for_status=StatusEnum.overdue, for_campaign=campaign)
async def daemon_iteration(session: async_scoped_session) -> None:
    """Run one pass of the daemon loop over due queue entries.

    Selects every active, unfinished ``Queue`` row whose ``time_next_check``
    has passed; processes each one whose node is in a processable state;
    reschedules every visited entry; commits; and finally makes a best-effort
    attempt at resource allocation if anything was processed.

    Parameters
    ----------
    session
        Async database session used for the queue query, node processing,
        and the final commit.
    """
    iteration_start = timestamp.now_utc()
    processed_nodes = 0
    queue_entries = await session.execute(
        select(Queue).where(
            (Queue.active) & (Queue.time_next_check < iteration_start) & (Queue.time_finished.is_(None))
        )
    )
    logger.debug("Daemon Iteration: %s", iteration_start)

    queue_entry: Queue
    for (queue_entry,) in queue_entries:
        try:
            queued_node = await queue_entry.get_node(session)
            # Scripts and elements expose distinct "processable" predicates.
            if (
                queued_node.status.is_processable_script()
                if isinstance(queued_node, Script)
                else queued_node.status.is_processable_element()
            ):
                logger.info("Processing queue_entry", node=queued_node.fullname)
                await queue_entry.process_node(session)
                processed_nodes += 1
                sleep_time = await queue_entry.node_sleep_time(session)
            else:
                # Put this entry to sleep for a while
                logger.debug("Not processing queue_entry", node=queued_node.fullname)
                sleep_time = config.daemon.processing_interval
            # FIXME time for the next check should be the sleep time weighted
            # by the node
            time_next_check = iteration_start + timedelta(seconds=sleep_time)
            queue_entry.time_next_check = time_next_check
            logger.info(f"Next check for {queued_node.fullname} at {time_next_check}")
            await check_due_date(session, queued_node, time_next_check)
        except Exception:
            # One bad entry must not abort the whole iteration; log and move
            # on. BUGFIX: logger.exception() previously got no event/message,
            # which itself raises TypeError and would kill the loop.
            logger.exception("Failed to process queue entry")
            continue
    await session.commit()

    # Try to allocate resources at the end of the loop, but do not crash if it
    # doesn't work.
    # FIXME this could be run async
    try:
        if config.daemon.allocate_resources and processed_nodes > 0:
            allocate_resources()
    except Exception:
        logger.exception("Resource allocation failed")
def allocate_resources() -> None:
    """Allocate resources for htcondor jobs submitted during the daemon
    iteration.

    Best-effort: returns silently when the HTCondor bindings are unavailable
    or when no idle jobs exist. Otherwise submits a local-universe condor job
    that runs the ``allocateNodes.py`` resource-allocation script; the job is
    fire-and-forget (its output is not preserved).
    """
    if (htcondor := import_htcondor()) is None:
        logger.warning("HTCondor is not available, not allocating resources")
        return

    coll = htcondor.Collector(config.htcondor.collector_host)

    # Do we need to allocate resources? i.e., are there idle condor jobs for
    # which we are responsible?
    #
    # FIXME we should round-robin submits to available schedds and approximate
    # a global query for our idle jobs, e.g.:
    #   schedds = coll.locateAll(htcondor.DaemonTypes.Schedd)
    #   idle_jobs = {ad: htcondor.Schedd(ad).query(
    #       projection=["ClusterId"], constraint="(JobStatus == 1)",
    #       opts=htcondor.QueryOpts.DefaultMyJobsOnly) for ad in schedds}
    #   idle_job_schedds = [k for k, v in idle_jobs.items() if v]
    # then pick one schedd with idle jobs per daemon iteration; if several
    # have idle jobs, the next loop picks up the rest.
    #
    # FIXME only queries the single schedd to which we are submitting jobs
    schedd_ad = coll.locate(htcondor.DaemonTypes.Schedd, name=config.htcondor.schedd_host)
    schedd = htcondor.Schedd(schedd_ad)
    # JobStatus == 1 is HTCondor's "Idle" state.
    idle_jobs = schedd.query(
        projection=["ClusterId"],
        constraint="(JobStatus == 1)",
        opts=htcondor.QueryOpts.DefaultMyJobsOnly,
    )
    if not idle_jobs:
        return

    # Set the htcondor config in the submission environment
    # The environment command in the submit file is a double-quoted,
    # whitespace-delimited list of name=value pairs where literal quote marks
    # are doubled ("" or '').
    submission_environment = " ".join(f"{k}={v}" for k, v in build_htcondor_submit_environment().items())

    # Optional slurm exclusivity flag; defaults to a bare separating space so
    # the arguments string below stays well-formed either way.
    exclusive = " "
    if config.slurm.exclusive:
        exclusive = " --" + config.slurm.exclusive + exclusive

    # The minimum necessary submission spec executes a resource allocation
    # script to the local universe and does not preserve the output.
    submission_spec = {
        "executable": f"{config.htcondor.remote_user_home}/.local/bin/allocateNodes.py",
        "arguments": (
            f"--auto --account {config.slurm.account} -n 50 -m {config.slurm.duration} "
            f"-q {config.slurm.partition} -g 240 -c {config.slurm.cores}"
            f"{exclusive}"
            f"{config.slurm.extra_arguments} "
            f"{config.slurm.platform}"
        ),
        "environment": f'"{submission_environment}"',
        "initialdir": config.htcondor.working_directory,
        "batch_name": config.htcondor.batch_name,
        "universe": "local",
    }
    submit_ad = htcondor.Submit(submission_spec)
    # job cluster id of our resource allocation script; fire and forget
    cluster_id = schedd.submit(submit_ad)
    logger.info("Allocating Resources with condor job %s", cluster_id.cluster())
    logger.debug(cluster_id)