-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathscaffolding.py
More file actions
198 lines (171 loc) · 8.13 KB
/
scaffolding.py
File metadata and controls
198 lines (171 loc) · 8.13 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
"""Demand execution scaffolding handler.
Provides Lambda handlers for preparing demand execution scaffolding,
including file system setup and batch job configuration.
"""
from dataclasses import dataclass
from pathlib import Path
from aibs_informatics_aws_utils.batch import build_retry_strategy
from aibs_informatics_aws_utils.constants.efs import (
EFS_SCRATCH_ACCESS_POINT_NAME,
EFS_SCRATCH_PATH,
EFS_SHARED_ACCESS_POINT_NAME,
EFS_SHARED_PATH,
EFS_TMP_ACCESS_POINT_NAME,
EFS_TMP_PATH,
)
from aibs_informatics_aws_utils.efs import MountPointConfiguration
from aibs_informatics_core.env import EnvBase
from aibs_informatics_aws_lambda.common.handler import LambdaHandler
from aibs_informatics_aws_lambda.handlers.demand.context_manager import (
BatchEFSConfiguration,
DemandExecutionContextManager,
)
from aibs_informatics_aws_lambda.handlers.demand.model import (
CreateDefinitionAndPrepareArgsRequest,
DemandExecutionCleanupConfigs,
DemandExecutionSetupConfigs,
PrepareDemandScaffoldingRequest,
PrepareDemandScaffoldingResponse,
)
@dataclass
class PrepareDemandScaffoldingHandler(
    LambdaHandler[PrepareDemandScaffoldingRequest, PrepareDemandScaffoldingResponse]
):
    """Lambda handler that prepares the scaffolding for a demand execution.

    Handling a request produces:
        - EFS volume configurations for scratch, shared and (optionally) tmp storage
        - Data sync requests to run before the execution
        - Data sync and data-path removal requests to run after the execution
        - The arguments used to create the batch job definition

    Example:
        ```python
        handler = PrepareDemandScaffoldingHandler.get_handler()
        response = handler(event, context)
        ```
    """

    def handle(self, request: PrepareDemandScaffoldingRequest) -> PrepareDemandScaffoldingResponse:
        """Build the setup and cleanup configurations for a demand execution.

        Each volume falls back to a default access point name and a default
        container path (``/opt/efs`` followed by the matching EFS path constant)
        when the request leaves that field empty. The scratch and tmp volumes
        are configured writable; the shared volume is configured read-only.

        Args:
            request (PrepareDemandScaffoldingRequest): Request carrying the demand
                execution, the file system configurations and the context manager
                configuration.

        Returns:
            Response holding the context manager's demand execution together with
            the setup and cleanup configurations.
        """
        fs_configs = request.file_system_configurations

        scratch = fs_configs.scratch
        scratch_vol_configuration = construct_batch_efs_configuration(
            env_base=self.env_base,
            file_system=scratch.file_system,
            access_point=scratch.access_point or EFS_SCRATCH_ACCESS_POINT_NAME,
            container_path=scratch.container_path or f"/opt/efs{EFS_SCRATCH_PATH}",
            read_only=False,
        )

        shared = fs_configs.shared
        shared_vol_configuration = construct_batch_efs_configuration(
            env_base=self.env_base,
            file_system=shared.file_system,
            access_point=shared.access_point or EFS_SHARED_ACCESS_POINT_NAME,
            container_path=shared.container_path or f"/opt/efs{EFS_SHARED_PATH}",
            read_only=True,
        )

        # The tmp volume is optional: no configuration is built when it is absent.
        tmp = fs_configs.tmp
        tmp_vol_configuration = (
            construct_batch_efs_configuration(
                env_base=self.env_base,
                file_system=tmp.file_system,
                access_point=tmp.access_point or EFS_TMP_ACCESS_POINT_NAME,
                container_path=tmp.container_path or f"/opt/efs{EFS_TMP_PATH}",
                read_only=False,
            )
            if tmp is not None
            else None
        )

        context_manager = DemandExecutionContextManager(
            demand_execution=request.demand_execution,
            scratch_vol_configuration=scratch_vol_configuration,
            shared_vol_configuration=shared_vol_configuration,
            tmp_vol_configuration=tmp_vol_configuration,
            configuration=request.context_manager_configuration,
            env_base=self.env_base,
        )
        batch_job_builder = context_manager.batch_job_builder
        self.setup_file_system(context_manager)

        # Each sync request is round-tripped through its dict form.
        # NOTE(review): presumably this yields fresh, normalized copies - confirm.
        pre_execution_sync_requests = [
            req.from_dict(req.to_dict())
            for req in context_manager.pre_execution_data_sync_requests
        ]
        batch_create_request = CreateDefinitionAndPrepareArgsRequest(
            image=batch_job_builder.image,
            job_definition_name=batch_job_builder.job_definition_name,
            job_name=batch_job_builder.job_name,
            job_queue_name=context_manager.batch_job_queue_name,
            job_definition_tags=batch_job_builder.job_definition_tags,
            command=batch_job_builder.command,
            environment=batch_job_builder.environment,
            resource_requirements=batch_job_builder.resource_requirements,
            mount_points=batch_job_builder.mount_points,
            volumes=batch_job_builder.volumes,
            # The retry count is fixed at 5 for every demand execution.
            retry_strategy=build_retry_strategy(num_retries=5),
            privileged=batch_job_builder.privileged,
            job_role_arn=batch_job_builder.job_role_arn,
        )
        setup_configs = DemandExecutionSetupConfigs(
            data_sync_requests=pre_execution_sync_requests,
            batch_create_request=batch_create_request,
        )

        post_execution_sync_requests = [
            req.from_dict(req.to_dict())
            for req in context_manager.post_execution_data_sync_requests
        ]
        cleanup_configs = DemandExecutionCleanupConfigs(
            data_sync_requests=post_execution_sync_requests,
            remove_data_paths_requests=context_manager.post_execution_remove_data_paths_requests,
        )

        return PrepareDemandScaffoldingResponse(
            demand_execution=context_manager.demand_execution,
            setup_configs=setup_configs,
            cleanup_configs=cleanup_configs,
        )

    def setup_file_system(self, context_manager: DemandExecutionContextManager):
        """Read the container working path for the execution.

        At present this only reads ``container_working_path`` from the context
        manager; the directory creation step is disabled (see the commented-out
        call below).

        Args:
            context_manager (DemandExecutionContextManager): Context manager whose
                container working path is read.
        """
        working_path = context_manager.container_working_path  # noqa: F841
        # Directory creation is intentionally left disabled:
        # working_path.mkdir(parents=True, exist_ok=True)
def construct_batch_efs_configuration(
    env_base: EnvBase,
    container_path: Path | str,
    file_system: str | None,
    access_point: str | None,
    read_only: bool = False,
) -> BatchEFSConfiguration:
    """Build the BatchEFSConfiguration for a single volume.

    A mount point configuration is built from the container path, file system
    and access point, and is then wrapped together with the read-only flag.
    The environment base is passed as the ``env_base`` tag for both the access
    point and the file system; how those tags are used to resolve resources is
    up to ``MountPointConfiguration.build``.

    Args:
        env_base (EnvBase): Environment base passed as the ``env_base`` tag value.
        container_path (Union[Path, str]): Mount point of the volume in the container.
        file_system (Optional[str]): File system identifier, or None.
        access_point (Optional[str]): Access point identifier, or None.
        read_only (bool): Whether the mount should be read-only. Defaults to False.

    Returns:
        BatchEFSConfiguration wrapping the built mount point configuration.
    """
    return BatchEFSConfiguration(
        mount_point_config=MountPointConfiguration.build(
            mount_point=container_path,
            access_point=access_point,
            file_system=file_system,
            # Two separate dict objects are passed, one per tag argument.
            access_point_tags={"env_base": env_base},
            file_system_tags={"env_base": env_base},
        ),
        read_only=read_only,
    )
# Module-level handler callable built by ``get_handler()``; the class docstring
# shows it being invoked as ``handler(event, context)``.
handler = PrepareDemandScaffoldingHandler.get_handler()