-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy path.project-metadata.yaml
89 lines (74 loc) · 2.12 KB
/
.project-metadata.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
# Top-level metadata identifying this AMP.
name: Synthetic Data Studio
# Folded scalar: the wrapped lines below are joined with single spaces into
# one line that ends with a single newline.
description: >
  This AMP demonstrates how we can generate synthetic data for finetuning,
  ground truth for LLM use case evaluation, embedding finetuning etc.
author: Cloudera Inc.
# NOTE(review): an unquoted 1.0 is read as a float by generic YAML loaders;
# confirm what the consumer expects before quoting or changing these.
specification_version: 1.0
prototype_version: 1.0
# Quoted so the value stays a string rather than being parsed as a date.
date: '2024-10-30'
# Environment variables declared for the project. Every entry carries a
# placeholder `default` and a short `description`.
environment_variables:
  # AWS credentials and region.
  AWS_ACCESS_KEY_ID:
    description: >-
      AWS Key ID. Check the Amazon Bedrock documentation for information
      about role access
    default: 'your access key'
  AWS_SECRET_ACCESS_KEY:
    description: 'AWS Secret Key'
    default: 'your secret access key'
  AWS_DEFAULT_REGION:
    description: 'AWS region'
    default: 'us-east-1'
  # Hugging Face token and username (see the placeholder defaults).
  hf_token:
    description: 'hf_token'
    default: 'your huggingface token'
  hf_username:
    description: 'hf_username'
    default: 'your huggingface username'
# Runtime selection: a single entry pairing the JupyterLab editor with the
# Standard edition of the Python 3.10 kernel.
runtimes:
  - edition: Standard
    editor: JupyterLab
    kernel: 'Python 3.10'
# Task list, in file order: create the template job, create and then run the
# client build job, and finally start the application.
tasks:
  # Disabled session task for installing dependencies; kept for reference.
  # - type: run_session
  #   name: Install Dependencies
  #   script: setup.py
  #   short_summary: Install Dependencies
  #   kernel: python3
  #   cpu: 2
  #   memory: 4

  # Template job for creating synthetic datasets.
  - type: create_job
    name: Synthetic_data_base_job
    entity_label: synthetic_data_job_template
    script: app/text_examples.py
    # 'None' is a plain string in YAML, not a null value.
    # NOTE(review): confirm the script is meant to receive the literal
    # argument "None".
    arguments: 'None'
    short_summary: Create Template Job for creating synthetic datasets.
    long_summary: Create Template Job for creating synthetic datasets.
    cpu: 1
    memory: 2
    environment:
      TASK_TYPE: 'CREATE/RUN_JOB'

  # Job that builds the client application.
  - type: create_job
    name: Build Client Application
    entity_label: build_client_app
    script: build/build_client.py
    # Same literal string "None" as in the template job above.
    arguments: 'None'
    short_summary: Create job to build client application
    cpu: 2
    memory: 2
    environment:
      TASK_TYPE: 'CREATE/RUN_JOB'

  # Runs the job whose entity_label is build_client_app (created just above).
  - type: run_job
    entity_label: build_client_app
    short_summary: Run job to build client application

  # Starts the client/server application.
  - type: start_application
    name: Synthetic Data Studio
    subdomain: synthetic-data-generator
    script: build/start_application.py
    long_summary: Launching client/server application
    cpu: 2
    memory: 8
    # This task uses `environment_variables` where the create_job tasks use
    # `environment`. NOTE(review): confirm both key names against the AMP
    # project specification.
    environment_variables:
      TASK_TYPE: START_APPLICATION